{ "schemaVersion": 1, "deviceProperties": [ { "id": 0, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 1, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 2, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 3, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 4, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 5, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 6, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 7, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 } ], "cupti_version": 22, "cuda_runtime_version": 12040, "cuda_driver_version": 12080, "distributedInfo": {"backend": "nccl", "rank": 6, "world_size": 8, "pg_count": 1, "pg_config": [{"pg_name": "0", "pg_desc": "default_pg", "backend_config": "cuda:nccl", "pg_size": 8, "ranks": [0, 1, 2, 3, 4, 5, 6, 7]}], "nccl_version": "2.21.5"}, "record_shapes": 1, "trace_id": "95763B3072364D998E59D026E27F441D", "traceEvents": [ { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: DivBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650730337.873, "dur": 114.218, "args": { "External id": 17409,"Record function id": 0, "Sequence number": 246770, "Fwd thread id": 1, "Ev Idx": 0 } }, { "ph": "X", "cat": "cpu_op", "name": "DivBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650730357.936, "dur": 85.190, "args": { "External id": 17410,"Sequence number": 246770, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 1 } }, { "ph": "f", "id": 1, "pid": 1336759, "tid": 1381173, "ts": 1295650730357.936, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336759, "tid": 1381173, "ts": 1295650730366.749, "dur": 74.093, "args": { "External id": 17411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 2 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650730466.908, "dur": 202.571, "args": { "External id": 17412,"Record function id": 0, "Ev Idx": 3 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650730521.861, "dur": 84.536, "args": { "External id": 17413,"Record function id": 0, "Ev Idx": 4 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.27", "pid": 1336759, "tid": 1381173, "ts": 1295650730549.378, "dur": 44.417, "args": { "External id": 17414,"Record function id": 0, "Ev Idx": 5 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650730611.542, "dur": 1.764, "args": { "External id": 17415,"Sequence number": 246769, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6 } }, { "ph": "f", "id": 2, "pid": 1336759, "tid": 1381173, "ts": 1295650730611.542, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650730617.237, "dur": 47.975, "args": { "External id": 17416,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 7 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650730625.735, "dur": 38.928, "args": { "External id": 17417,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 8 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650730634.216, "dur": 2.412, "args": { "External id": 17418,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650730677.386, "dur": 36995.928, "args": { "External id": 17419,"Record function id": 0, "Sequence number": 246767, "Fwd thread id": 1, "Ev Idx": 10 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650730679.021, "dur": 36982.963, "args": { "External id": 17420,"Sequence number": 246767, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11 } }, { "ph": "f", "id": 3, "pid": 1336759, "tid": 1381173, "ts": 1295650730679.021, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650730717.809, "dur": 4.361, "args": { "External id": 17421,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 12 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650730724.954, "dur": 36828.127, "args": { "External id": 17422,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 13 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650730729.637, "dur": 36823.087, "args": { "External id": 17423,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 14 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650730733.591, "dur": 5.922, "args": { "External id": 17424,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 15 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650730741.207, "dur": 36809.961, "args": { "External id": 17425,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 16 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336759, "tid": 1381173, "ts": 1295650767558.195, "dur": 0.579, "args": { "External id": 17426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 17 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650767561.133, "dur": 3.486, "args": { "External id": 17427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 18 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650767563.277, "dur": 1.193, "args": { "External id": 17428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 19 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1381173, "ts": 1295650767570.678, "dur": 30.038, "args": { "External id": 17429,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 20 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1381173, "ts": 1295650767609.145, "dur": 43.687, "args": { "External id": 17430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 21 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1381173, "ts": 1295650767610.867, "dur": 41.745, "args": { "External id": 17431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 22 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1381173, "ts": 1295650767612.533, "dur": 39.849, "args": { "External id": 17432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 23 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767683.450, "dur": 15.749, "args": { "External id": 17433,"Record function id": 0, "Sequence number": 246766, "Fwd thread id": 1, "Ev Idx": 24 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767685.313, "dur": 11.203, "args": { "External id": 17434,"Sequence number": 246766, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 25 } }, { "ph": "f", "id": 4, "pid": 1336759, "tid": 1381173, "ts": 1295650767685.313, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650767689.130, "dur": 7.163, "args": { "External id": 17435,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 26 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650767691.375, "dur": 4.722, "args": { "External id": 17436,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 27 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767703.139, "dur": 91.230, "args": { "External id": 17437,"Record function id": 0, "Sequence number": 246765, "Fwd thread id": 1, "Ev Idx": 28 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767704.178, "dur": 83.812, "args": { "External id": 17438,"Sequence number": 246765, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 29 } }, { "ph": "f", "id": 5, "pid": 1336759, "tid": 1381173, "ts": 1295650767704.178, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650767708.719, "dur": 78.641, "args": { "External id": 17439,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 30 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650767714.899, "dur": 31.358, "args": { "External id": 17440,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 31 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650767717.499, "dur": 4.760, "args": { "External id": 17441,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 32 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650767723.944, "dur": 22.026, "args": { "External id": 17442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 33 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650767728.028, "dur": 17.387, "args": { "External id": 17443,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 34 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650767748.648, "dur": 5.902, "args": { "External id": 17444,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 35 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650767752.716, "dur": 1.400, "args": { "External id": 17445,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 36 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650767755.689, "dur": 30.818, "args": { "External id": 17446,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 37 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767799.516, "dur": 59.514, "args": { "External id": 17447,"Record function id": 0, "Sequence number": 246764, "Fwd thread id": 1, "Ev Idx": 38 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767800.596, "dur": 55.418, "args": { "External id": 17448,"Sequence number": 246764, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 39 } }, { "ph": "f", "id": 6, "pid": 1336759, "tid": 1381173, "ts": 1295650767800.596, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650767804.412, "dur": 51.324, "args": { "External id": 17449,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "3"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 40 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650767808.456, "dur": 18.823, "args": { "External id": 17450,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 41 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650767809.944, "dur": 3.026, "args": { "External id": 17451,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 42 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650767813.687, "dur": 13.332, "args": { "External id": 17452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 43 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650767815.452, "dur": 11.137, "args": { "External id": 17453,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 44 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650767831.453, "dur": 6.554, "args": { "External id": 17454,"Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 45 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650767836.443, "dur": 0.851, "args": { "External id": 17455,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 46 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650767838.716, "dur": 16.503, "args": { "External id": 17456,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 47 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767863.297, "dur": 110.256, "args": { "External id": 17457,"Record function id": 0, "Sequence number": 246763, "Fwd thread id": 1, "Ev Idx": 48 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767864.324, "dur": 105.884, "args": { "External id": 17458,"Sequence number": 246763, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 49 } }, { "ph": "f", "id": 7, "pid": 1336759, "tid": 1381173, "ts": 1295650767864.324, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650767866.131, "dur": 103.626, "args": { "External id": 17459,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 50 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650767870.058, "dur": 14.935, "args": { "External id": 17460,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 51 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650767871.089, "dur": 2.089, "args": { "External id": 17461,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 52 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650767873.949, "dur": 10.790, "args": { "External id": 17462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 53 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650767874.736, "dur": 9.644, "args": { "External id": 17463,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 54 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650767888.511, "dur": 3.055, "args": { "External id": 17464,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 55 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650767890.542, "dur": 0.855, "args": { "External id": 17465,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 56 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650767892.245, "dur": 76.677, "args": { "External id": 17466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 57 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650767980.559, "dur": 126.262, "args": { "External id": 17467,"Record function id": 0, "Sequence number": 246762, "Fwd thread id": 1, "Ev Idx": 58 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650768010.422, "dur": 92.577, "args": { "External id": 17468,"Sequence number": 246762, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 59 } }, { "ph": "f", "id": 8, "pid": 1336759, "tid": 1381173, "ts": 1295650768010.422, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650768012.802, "dur": 89.890, "args": { "External id": 17469,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 60 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650768014.611, "dur": 22.892, "args": { "External id": 17470,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 61 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650768015.967, "dur": 4.530, "args": { "External id": 17471,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 62 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650768021.402, "dur": 15.848, "args": { "External id": 17472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 63 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650768022.329, "dur": 14.513, "args": { "External id": 17473,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 64 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650768040.904, "dur": 4.813, "args": { "External id": 17474,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 65 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650768044.874, "dur": 0.601, "args": { "External id": 17475,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 66 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650768046.568, "dur": 55.432, "args": { "External id": 17476,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 67 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650768112.689, "dur": 33.534, "args": { "External id": 17477,"Record function id": 0, "Sequence number": 246761, "Fwd thread id": 1, "Ev Idx": 68 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650768114.098, "dur": 0.948, "args": { "External id": 17478,"Sequence number": 246761, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 69 } }, { "ph": "f", "id": 9, "pid": 1336759, "tid": 1381173, "ts": 1295650768114.098, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650768117.741, "dur": 25.198, "args": { "External id": 17479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 70 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650768119.771, "dur": 22.671, "args": { "External id": 17480,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 71 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650768126.453, "dur": 0.492, "args": { "External id": 17481,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 72 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650768150.882, "dur": 2271.322, "args": { "External id": 17482,"Record function id": 0, "Sequence number": 246759, "Fwd thread id": 1, "Ev Idx": 73 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650768152.534, "dur": 2238.950, "args": { "External id": 17483,"Sequence number": 246759, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 74 } }, { "ph": "f", "id": 10, "pid": 1336759, "tid": 1381173, "ts": 1295650768152.534, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650768190.692, "dur": 3.470, "args": { "External id": 17484,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 75 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650768196.526, "dur": 2103.795, "args": { "External id": 17485,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 76 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650768198.417, "dur": 2101.563, "args": { "External id": 17486,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 77 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650768201.573, "dur": 4.006, "args": { "External id": 17487,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 78 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650768208.884, "dur": 2090.062, "args": { "External id": 17488,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 79 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336759, "tid": 1381173, "ts": 1295650770304.762, "dur": 0.463, "args": { "External id": 17489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 80 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650770306.826, "dur": 2.914, "args": { "External id": 17490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 81 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650770308.611, "dur": 1.008, "args": { "External id": 17491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 82 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1381173, "ts": 1295650770314.025, "dur": 22.908, "args": { "External id": 17492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 83 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1381173, "ts": 1295650770343.002, "dur": 40.904, "args": { "External id": 17493,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 84 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1381173, "ts": 1295650770344.298, "dur": 39.440, "args": { "External id": 17494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 85 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1381173, "ts": 1295650770345.892, "dur": 37.537, "args": { "External id": 17495,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 86 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650770400.126, "dur": 18.686, "args": { "External id": 17496,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 87 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770430.345, "dur": 14.127, "args": { "External id": 17497,"Record function id": 0, "Sequence number": 246758, "Fwd thread id": 1, "Ev Idx": 88 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770433.618, "dur": 8.736, "args": { "External id": 17498,"Sequence number": 246758, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 89 } }, { "ph": "f", "id": 11, "pid": 1336759, "tid": 1381173, "ts": 1295650770433.618, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650770436.479, "dur": 5.686, "args": { "External id": 17499,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 90 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650770438.415, "dur": 3.576, "args": { "External id": 17500,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 91 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770448.408, "dur": 62.158, "args": { "External id": 17501,"Record function id": 0, "Sequence number": 246757, "Fwd thread id": 1, "Ev Idx": 92 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770449.309, "dur": 56.854, "args": { "External id": 17502,"Sequence number": 246757, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 93 } }, { "ph": "f", "id": 12, "pid": 1336759, "tid": 1381173, "ts": 1295650770449.309, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650770451.310, "dur": 54.349, "args": { "External id": 17503,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 94 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650770454.006, "dur": 18.772, "args": { "External id": 17504,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 95 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650770455.952, "dur": 2.767, "args": { "External id": 17505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 96 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650770459.490, "dur": 13.055, "args": { "External id": 17506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 97 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650770460.710, "dur": 11.488, "args": { "External id": 17507,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 98 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650770474.064, "dur": 4.631, "args": { "External id": 17508,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 99 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770476.415, "dur": 1.981, "args": { "External id": 17509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650770481.613, "dur": 23.321, "args": { "External id": 17510,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770514.587, "dur": 53.344, "args": { "External id": 17511,"Record function id": 0, "Sequence number": 246756, "Fwd thread id": 1, "Ev Idx": 102 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770515.414, "dur": 49.995, "args": { "External id": 17512,"Sequence number": 246756, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 103 } }, { "ph": "f", "id": 13, "pid": 1336759, "tid": 1381173, "ts": 1295650770515.414, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650770517.811, "dur": 47.330, "args": { "External id": 17513,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "2"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650770519.723, "dur": 22.085, "args": { "External id": 17514,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650770520.855, "dur": 2.641, "args": { "External id": 17515,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650770524.306, "dur": 17.232, "args": { "External id": 17516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650770525.068, "dur": 16.052, "args": { "External id": 17517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650770543.128, "dur": 7.186, "args": { "External id": 17518,"Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770548.859, "dur": 0.876, "args": { "External id": 17519,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650770550.985, "dur": 13.623, "args": { "External id": 17520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770571.878, "dur": 93.505, "args": { "External id": 17521,"Record function id": 0, "Sequence number": 246755, "Fwd thread id": 1, "Ev Idx": 112 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770573.081, "dur": 89.528, "args": { "External id": 17522,"Sequence number": 246755, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 113 } }, { "ph": "f", "id": 14, "pid": 1336759, "tid": 1381173, "ts": 1295650770573.081, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650770574.824, "dur": 87.489, "args": { "External id": 17523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650770576.111, "dur": 15.176, "args": { "External id": 17524,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650770577.619, "dur": 2.221, "args": { "External id": 17525,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650770580.355, "dur": 10.672, "args": { "External id": 17526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650770581.618, "dur": 9.102, "args": { "External id": 17527,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650770592.142, "dur": 5.216, "args": { "External id": 17528,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770596.280, "dur": 0.904, "args": { "External id": 17529,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650770598.036, "dur": 63.599, "args": { "External id": 17530,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770671.664, "dur": 87.559, "args": { "External id": 17531,"Record function id": 0, "Sequence number": 246754, "Fwd thread id": 1, "Ev Idx": 122 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770672.618, "dur": 68.645, "args": { "External id": 17532,"Sequence number": 246754, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 123 } }, { "ph": "f", "id": 15, "pid": 1336759, "tid": 1381173, "ts": 1295650770672.618, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650770674.271, "dur": 66.719, "args": { "External id": 17533,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650770675.351, "dur": 14.371, "args": { "External id": 17534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650770676.098, "dur": 1.830, "args": { "External id": 17535,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650770678.665, "dur": 10.793, "args": { "External id": 17536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650770679.344, "dur": 9.799, "args": { "External id": 17537,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650770690.678, "dur": 2.632, "args": { "External id": 17538,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770692.693, "dur": 0.442, "args": { "External id": 17539,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650770694.067, "dur": 46.307, "args": { "External id": 17540,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650770744.281, "dur": 13.656, "args": { "External id": 17541,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 132 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770765.732, "dur": 28.684, "args": { "External id": 17542,"Record function id": 0, "Sequence number": 246753, "Fwd thread id": 1, "Ev Idx": 133 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650770766.733, "dur": 0.720, "args": { "External id": 17543,"Sequence number": 246753, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 134 } }, { "ph": "f", "id": 16, "pid": 1336759, "tid": 1381173, "ts": 1295650770766.733, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650770769.423, "dur": 22.296, "args": { "External id": 17544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650770771.046, "dur": 20.228, "args": { "External id": 17545,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770775.342, "dur": 1.626, "args": { "External id": 17546,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650770798.407, "dur": 3123.232, "args": { "External id": 17547,"Record function id": 0, "Sequence number": 246751, "Fwd thread id": 1, "Ev Idx": 138 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650770801.963, "dur": 3096.534, "args": { "External id": 17548,"Sequence number": 246751, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 139 } }, { "ph": "f", "id": 17, "pid": 1336759, "tid": 1381173, "ts": 1295650770801.963, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650770829.960, "dur": 2.229, "args": { "External id": 17549,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650770834.084, "dur": 2979.200, "args": { "External id": 17550,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650770835.402, "dur": 2977.457, "args": { "External id": 17551,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650770837.889, "dur": 4.240, "args": { "External id": 17552,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650770843.229, "dur": 2968.572, "args": { "External id": 17553,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336759, "tid": 1381173, "ts": 1295650773817.193, "dur": 0.347, "args": { "External id": 17554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650773819.137, "dur": 4.392, "args": { "External id": 17555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 146 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650773822.634, "dur": 0.768, "args": { "External id": 17556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1381173, "ts": 1295650773827.362, "dur": 20.531, "args": { "External id": 17557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1381173, "ts": 1295650773852.794, "dur": 38.484, "args": { "External id": 17558,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1381173, "ts": 1295650773854.367, "dur": 36.731, "args": { "External id": 17559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1381173, "ts": 1295650773855.496, "dur": 35.253, "args": { "External id": 17560,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650773905.659, "dur": 13.132, "args": { "External id": 17561,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650773931.854, "dur": 11.098, "args": { "External id": 17562,"Record function id": 0, "Sequence number": 246750, "Fwd thread id": 1, "Ev Idx": 153 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650773933.367, "dur": 7.682, "args": { "External id": 17563,"Sequence number": 246750, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 154 } }, { "ph": "f", "id": 18, "pid": 1336759, "tid": 1381173, "ts": 1295650773933.367, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650773936.007, "dur": 4.833, "args": { "External id": 17564,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650773937.980, "dur": 2.752, "args": { "External id": 17565,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650773946.230, "dur": 89.595, "args": { "External id": 17566,"Record function id": 0, "Sequence number": 246749, "Fwd thread id": 1, "Ev Idx": 157 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650773949.707, "dur": 80.628, "args": { "External id": 17567,"Sequence number": 246749, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 158 } }, { "ph": "f", "id": 19, "pid": 1336759, "tid": 1381173, "ts": 1295650773949.707, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650773951.660, "dur": 78.200, "args": { "External id": 17568,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650773954.271, "dur": 19.675, "args": { "External id": 17569,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650773956.330, "dur": 2.572, "args": { "External id": 17570,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650773959.740, "dur": 13.940, "args": { "External id": 17571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650773961.185, "dur": 12.061, "args": { "External id": 17572,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650773975.399, "dur": 3.716, "args": { "External id": 17573,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650773978.159, "dur": 0.679, "args": { "External id": 17574,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650773980.240, "dur": 48.389, "args": { "External id": 17575,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 166 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774041.608, "dur": 51.077, "args": { "External id": 17576,"Record function id": 0, "Sequence number": 246748, "Fwd thread id": 1, "Ev Idx": 167 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774042.991, "dur": 47.094, "args": { "External id": 17577,"Sequence number": 246748, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 168 } }, { "ph": "f", "id": 20, "pid": 1336759, "tid": 1381173, "ts": 1295650774042.991, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650774045.507, "dur": 44.348, "args": { "External id": 17578,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650774049.654, "dur": 17.000, "args": { "External id": 17579,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650774050.977, "dur": 2.840, "args": { "External id": 17580,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650774054.432, "dur": 11.984, "args": { "External id": 17581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650774055.126, "dur": 10.967, "args": { "External id": 17582,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650774067.746, "dur": 7.116, "args": { "External id": 17583,"Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650774071.986, "dur": 2.421, "args": { "External id": 17584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650774075.818, "dur": 13.482, "args": { "External id": 17585,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774096.478, "dur": 92.173, "args": { "External id": 17586,"Record function id": 0, "Sequence number": 246747, "Fwd thread id": 1, "Ev Idx": 177 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774097.453, "dur": 88.628, "args": { "External id": 17587,"Sequence number": 246747, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 178 } }, { "ph": "f", "id": 21, "pid": 1336759, "tid": 1381173, "ts": 1295650774097.453, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650774099.119, "dur": 86.553, "args": { "External id": 17588,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650774100.184, "dur": 25.188, "args": { "External id": 17589,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650774103.500, "dur": 2.031, "args": { "External id": 17590,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650774106.157, "dur": 18.945, "args": { "External id": 17591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650774106.594, "dur": 18.125, "args": { "External id": 17592,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650774126.426, "dur": 2.950, "args": { "External id": 17593,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650774128.423, "dur": 0.713, "args": { "External id": 17594,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650774129.939, "dur": 54.989, "args": { "External id": 17595,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 186 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774192.350, "dur": 102.868, "args": { "External id": 17596,"Record function id": 0, "Sequence number": 246746, "Fwd thread id": 1, "Ev Idx": 187 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774193.406, "dur": 84.047, "args": { "External id": 17597,"Sequence number": 246746, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 188 } }, { "ph": "f", "id": 22, "pid": 1336759, "tid": 1381173, "ts": 1295650774193.406, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650774197.245, "dur": 79.901, "args": { "External id": 17598,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650774198.397, "dur": 15.419, "args": { "External id": 17599,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650774201.432, "dur": 1.681, "args": { "External id": 17600,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650774203.604, "dur": 9.951, "args": { "External id": 17601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650774204.303, "dur": 8.945, "args": { "External id": 17602,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650774214.638, "dur": 2.799, "args": { "External id": 17603,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650774216.413, "dur": 0.858, "args": { "External id": 17604,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650774217.944, "dur": 58.227, "args": { "External id": 17605,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650774282.027, "dur": 12.062, "args": { "External id": 17606,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 197 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774300.675, "dur": 28.710, "args": { "External id": 17607,"Record function id": 0, "Sequence number": 246745, "Fwd thread id": 1, "Ev Idx": 198 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650774301.672, "dur": 1.003, "args": { "External id": 17608,"Sequence number": 246745, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 199 } }, { "ph": "f", "id": 23, "pid": 1336759, "tid": 1381173, "ts": 1295650774301.672, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650774304.224, "dur": 21.247, "args": { "External id": 17609,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650774305.906, "dur": 19.089, "args": { "External id": 17610,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650774310.506, "dur": 0.560, "args": { "External id": 17611,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 202 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650774333.304, "dur": 3092.850, "args": { "External id": 17612,"Record function id": 0, "Sequence number": 246744, "Fwd thread id": 1, "Ev Idx": 203 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650774344.967, "dur": 3052.924, "args": { "External id": 17613,"Sequence number": 246744, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 204 } }, { "ph": "f", "id": 24, "pid": 1336759, "tid": 1381173, "ts": 1295650774344.967, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650774372.527, "dur": 2.743, "args": { "External id": 17614,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650774377.592, "dur": 2935.385, "args": { "External id": 17615,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650774378.872, "dur": 2933.715, "args": { "External id": 17616,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650774381.768, "dur": 3.122, "args": { "External id": 17617,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650774385.890, "dur": 2925.685, "args": { "External id": 17618,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336759, "tid": 1381173, "ts": 1295650777315.963, "dur": 0.333, "args": { "External id": 17619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650777317.312, "dur": 2.058, "args": { "External id": 17620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 211 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336759, "tid": 1381173, "ts": 1295650777318.596, "dur": 0.664, "args": { "External id": 17621,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1381173, "ts": 1295650777322.687, "dur": 20.854, "args": { "External id": 17622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1381173, "ts": 1295650777348.406, "dur": 42.792, "args": { "External id": 17623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1381173, "ts": 1295650777349.296, "dur": 41.689, "args": { "External id": 17624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1381173, "ts": 1295650777350.561, "dur": 40.096, "args": { "External id": 17625,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650777407.517, "dur": 13.928, "args": { "External id": 17626,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650777439.547, "dur": 12.624, "args": { "External id": 17627,"Record function id": 0, "Ev Idx": 218 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650777442.235, "dur": 7.964, "args": { "External id": 17628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650777445.167, "dur": 3.997, "args": { "External id": 17629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 220 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650777445.954, "dur": 3.111, "args": { "External id": 17630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 221 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777455.845, "dur": 10.169, "args": { "External id": 17631,"Record function id": 0, "Sequence number": 246743, "Fwd thread id": 1, "Ev Idx": 222 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777456.925, "dur": 6.842, "args": { "External id": 17632,"Sequence number": 246743, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 223 } }, { "ph": "f", "id": 25, "pid": 1336759, "tid": 1381173, "ts": 1295650777456.925, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650777459.551, "dur": 4.019, "args": { "External id": 17633,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650777460.874, "dur": 2.593, "args": { "External id": 17634,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 225 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777469.360, "dur": 60.935, "args": { "External id": 17635,"Record function id": 0, "Sequence number": 246742, "Fwd thread id": 1, "Ev Idx": 226 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777472.314, "dur": 53.894, "args": { "External id": 17636,"Sequence number": 246742, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 227 } }, { "ph": "f", "id": 26, "pid": 1336759, "tid": 1381173, "ts": 1295650777472.314, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650777474.182, "dur": 51.653, "args": { "External id": 17637,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650777476.733, "dur": 20.388, "args": { "External id": 17638,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650777478.643, "dur": 2.527, "args": { "External id": 17639,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650777482.324, "dur": 14.462, "args": { "External id": 17640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650777484.146, "dur": 12.083, "args": { "External id": 17641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650777498.674, "dur": 4.084, "args": { "External id": 17642,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650777501.722, "dur": 0.789, "args": { "External id": 17643,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650777503.828, "dur": 21.251, "args": { "External id": 17644,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 235 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777537.017, "dur": 47.178, "args": { "External id": 17645,"Record function id": 0, "Sequence number": 246741, "Fwd thread id": 1, "Ev Idx": 236 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777538.073, "dur": 43.664, "args": { "External id": 17646,"Sequence number": 246741, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 237 } }, { "ph": "f", "id": 27, "pid": 1336759, "tid": 1381173, "ts": 1295650777538.073, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650777540.138, "dur": 41.342, "args": { "External id": 17647,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650777543.670, "dur": 16.787, "args": { "External id": 17648,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650777544.744, "dur": 2.173, "args": { "External id": 17649,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650777547.449, "dur": 12.760, "args": { "External id": 17650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650777548.333, "dur": 11.543, "args": { "External id": 17651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650777561.742, "dur": 5.209, "args": { "External id": 17652,"Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650777565.595, "dur": 0.822, "args": { "External id": 17653,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650777567.869, "dur": 13.038, "args": { "External id": 17654,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 245 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777588.082, "dur": 92.979, "args": { "External id": 17655,"Record function id": 0, "Sequence number": 246740, "Fwd thread id": 1, "Ev Idx": 246 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777588.904, "dur": 89.660, "args": { "External id": 17656,"Sequence number": 246740, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 247 } }, { "ph": "f", "id": 28, "pid": 1336759, "tid": 1381173, "ts": 1295650777588.904, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650777590.378, "dur": 87.823, "args": { "External id": 17657,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650777593.938, "dur": 16.962, "args": { "External id": 17658,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650777597.587, "dur": 2.034, "args": { "External id": 17659,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650777600.366, "dur": 10.281, "args": { "External id": 17660,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650777601.381, "dur": 8.967, "args": { "External id": 17661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650777611.757, "dur": 3.646, "args": { "External id": 17662,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650777613.455, "dur": 1.758, "args": { "External id": 17663,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650777616.057, "dur": 61.337, "args": { "External id": 17664,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 255 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777684.710, "dur": 99.239, "args": { "External id": 17665,"Record function id": 0, "Sequence number": 246739, "Fwd thread id": 1, "Ev Idx": 256 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650777685.496, "dur": 82.428, "args": { "External id": 17666,"Sequence number": 246739, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 257 } }, { "ph": "f", "id": 29, "pid": 1336759, "tid": 1381173, "ts": 1295650777685.496, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650777687.055, "dur": 80.588, "args": { "External id": 17667,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1381173, "ts": 1295650777688.159, "dur": 22.541, "args": { "External id": 17668,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650777691.980, "dur": 1.749, "args": { "External id": 17669,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1381173, "ts": 1295650777697.552, "dur": 12.856, "args": { "External id": 17670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1381173, "ts": 1295650777699.795, "dur": 10.239, "args": { "External id": 17671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650777711.431, "dur": 4.589, "args": { "External id": 17672,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650777715.347, "dur": 0.499, "args": { "External id": 17673,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650777716.576, "dur": 50.431, "args": { "External id": 17674,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650777771.278, "dur": 11.009, "args": { "External id": 17675,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650777789.486, "dur": 349.793, "args": { "External id": 17676,"Record function id": 0, "Sequence number": 246738, "Fwd thread id": 1, "Ev Idx": 267 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650777791.018, "dur": 339.719, "args": { "External id": 17677,"Sequence number": 246738, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 268 } }, { "ph": "f", "id": 30, "pid": 1336759, "tid": 1381173, "ts": 1295650777791.018, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295650777937.049, "dur": 40.014, "args": { "External id": 17678,"kernel_hash": "cntjjtfhvxdzpnscrpib2i3ct2hk6s7qd3lqykazlircwdkp676d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "262144", "2048", "1", "1986", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/nt/cntjjtfhvxdzpnscrpib2i3ct2hk6s7qd3lqykazlircwdkp676d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [2048], [262144, 2048], [262144, 2048], [132, 2048], [262144], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 269 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_0", "pid": 1336759, "tid": 1381173, "ts": 1295650778046.018, "dur": 27.828, "args": { "External id": 17679,"kernel_hash": "cofxh4a56o46ifoz3xsku2krq37ug6i5slnssef2z53eyj4ipzd2", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/of/cofxh4a56o46ifoz3xsku2krq37ug6i5slnssef2z53eyj4ipzd2.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 270 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_1", "pid": 1336759, "tid": 1381173, "ts": 1295650778092.501, "dur": 15.917, "args": { "External id": 17680,"kernel_hash": "ckjxjmz2vylbnrnans6gouo3or7yw4dvfka55hu6q4kyfb7xeari", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/kj/ckjxjmz2vylbnrnans6gouo3or7yw4dvfka55hu6q4kyfb7xeari.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 271 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778151.560, "dur": 14.054, "args": { "External id": 17681,"Record function id": 0, "Ev Idx": 272 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778154.247, "dur": 10.430, "args": { "External id": 17682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778157.687, "dur": 6.090, "args": { "External id": 17683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 274 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778160.301, "dur": 3.304, "args": { "External id": 17684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 275 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: StackBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778172.208, "dur": 31.595, "args": { "External id": 17685,"Record function id": 0, "Sequence number": 246737, "Fwd thread id": 1, "Ev Idx": 276 } }, { "ph": "X", "cat": "cpu_op", "name": "StackBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778173.307, "dur": 24.324, "args": { "External id": 17686,"Sequence number": 246737, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 277 } }, { "ph": "f", "id": 31, "pid": 1336759, "tid": 1381173, "ts": 1295650778173.307, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650778175.590, "dur": 9.514, "args": { "External id": 17687,"Record function id": 0, "Concrete Inputs": ["", "-2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778181.717, "dur": 1.492, "args": { "External id": 17688,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650778185.902, "dur": 3.388, "args": { "External id": 17689,"Record function id": 0, "Concrete Inputs": ["", "-2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778188.200, "dur": 0.393, "args": { "External id": 17690,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650778190.007, "dur": 3.273, "args": { "External id": 17691,"Record function id": 0, "Concrete Inputs": ["", "-2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778191.942, "dur": 0.524, "args": { "External id": 17692,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1381173, "ts": 1295650778194.104, "dur": 2.831, "args": { "External id": 17693,"Record function id": 0, "Concrete Inputs": ["", "-2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778195.890, "dur": 0.531, "args": { "External id": 17694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 285 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778207.518, "dur": 4.636, "args": { "External id": 17695,"Record function id": 0, "Sequence number": 246736, "Fwd thread id": 1, "Ev Idx": 286 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778208.405, "dur": 1.134, "args": { "External id": 17696,"Sequence number": 246736, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 287 } }, { "ph": "f", "id": 32, "pid": 1336759, "tid": 1381173, "ts": 1295650778208.405, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650778216.783, "dur": 488.065, "args": { "External id": 17697,"Record function id": 0, "Sequence number": 246735, "Fwd thread id": 1, "Ev Idx": 288 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650778218.157, "dur": 475.521, "args": { "External id": 17698,"Sequence number": 246735, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 289 } }, { "ph": "f", "id": 33, "pid": 1336759, "tid": 1381173, "ts": 1295650778218.157, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778273.223, "dur": 12.997, "args": { "External id": 17699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650778280.038, "dur": 5.690, "args": { "External id": 17700,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778290.714, "dur": 8.284, "args": { "External id": 17701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778293.159, "dur": 5.068, "args": { "External id": 17702,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778297.140, "dur": 0.857, "args": { "External id": 17703,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1381173, "ts": 1295650778302.805, "dur": 118.604, "args": { "External id": 17704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778303.714, "dur": 4.577, "args": { "External id": 17705,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778304.427, "dur": 3.229, "args": { "External id": 17706,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778305.975, "dur": 1.532, "args": { "External id": 17707,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1381173, "ts": 1295650778309.742, "dur": 110.738, "args": { "External id": 17708,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650778313.907, "dur": 105.373, "args": { "External id": 17709,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650778426.298, "dur": 5.129, "args": { "External id": 17710,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778428.718, "dur": 2.548, "args": { "External id": 17711,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650778464.186, "dur": 4.812, "args": { "External id": 17712,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650778470.365, "dur": 2.563, "args": { "External id": 17713,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650778473.909, "dur": 1.596, "args": { "External id": 17714,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778513.115, "dur": 2.422, "args": { "External id": 17715,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778514.127, "dur": 1.259, "args": { "External id": 17716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336759, "tid": 1381173, "ts": 1295650778541.340, "dur": 133.686, "args": { "External id": 17717,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650778548.534, "dur": 7.688, "args": { "External id": 17718,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778553.582, "dur": 0.687, "args": { "External id": 17719,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650778558.421, "dur": 7.735, "args": { "External id": 17720,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778563.652, "dur": 1.748, "args": { "External id": 17721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650778568.050, "dur": 2.774, "args": { "External id": 17722,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778570.085, "dur": 0.335, "args": { "External id": 17723,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650778571.770, "dur": 3.197, "args": { "External id": 17724,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778573.967, "dur": 0.488, "args": { "External id": 17725,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650778581.858, "dur": 3.247, "args": { "External id": 17726,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778584.257, "dur": 0.493, "args": { "External id": 17727,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778586.335, "dur": 6.134, "args": { "External id": 17728,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650778590.456, "dur": 1.825, "args": { "External id": 17729,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650778593.424, "dur": 2.779, "args": { "External id": 17730,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778595.483, "dur": 0.383, "args": { "External id": 17731,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778597.165, "dur": 2.529, "args": { "External id": 17732,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778598.674, "dur": 0.899, "args": { "External id": 17733,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650778601.519, "dur": 57.363, "args": { "External id": 17734,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778662.861, "dur": 2.773, "args": { "External id": 17735,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650778666.766, "dur": 3.483, "args": { "External id": 17736,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778669.218, "dur": 0.425, "args": { "External id": 17737,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778672.533, "dur": 0.932, "args": { "External id": 17738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778716.972, "dur": 10.744, "args": { "External id": 17739,"Record function id": 0, "Ev Idx": 330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778719.740, "dur": 7.140, "args": { "External id": 17740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778722.299, "dur": 3.515, "args": { "External id": 17741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778723.464, "dur": 2.232, "args": { "External id": 17742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778732.152, "dur": 9.786, "args": { "External id": 17743,"Record function id": 0, "Sequence number": 246734, "Fwd thread id": 1, "Ev Idx": 334 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778733.615, "dur": 6.290, "args": { "External id": 17744,"Sequence number": 246734, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 335 } }, { "ph": "f", "id": 34, "pid": 1336759, "tid": 1381173, "ts": 1295650778733.615, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778735.688, "dur": 3.998, "args": { "External id": 17745,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778738.833, "dur": 0.762, "args": { "External id": 17746,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778746.077, "dur": 165.005, "args": { "External id": 17747,"Record function id": 0, "Sequence number": 246733, "Fwd thread id": 1, "Ev Idx": 338 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778747.105, "dur": 157.563, "args": { "External id": 17748,"Sequence number": 246733, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 339 } }, { "ph": "f", "id": 35, "pid": 1336759, "tid": 1381173, "ts": 1295650778747.105, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778751.456, "dur": 4.312, "args": { "External id": 17749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778752.838, "dur": 2.384, "args": { "External id": 17750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778754.483, "dur": 0.552, "args": { "External id": 17751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650778757.024, "dur": 53.767, "args": { "External id": 17752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778814.537, "dur": 4.349, "args": { "External id": 17753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778815.562, "dur": 2.484, "args": { "External id": 17754,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778816.984, "dur": 0.913, "args": { "External id": 17755,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778820.508, "dur": 3.696, "args": { "External id": 17756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778821.564, "dur": 2.143, "args": { "External id": 17757,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778823.144, "dur": 0.491, "args": { "External id": 17758,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650778826.683, "dur": 77.045, "args": { "External id": 17759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778915.726, "dur": 6.639, "args": { "External id": 17760,"Record function id": 0, "Sequence number": 246732, "Fwd thread id": 1, "Ev Idx": 351 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778916.881, "dur": 3.875, "args": { "External id": 17761,"Sequence number": 246732, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 352 } }, { "ph": "f", "id": 36, "pid": 1336759, "tid": 1381173, "ts": 1295650778916.881, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778918.266, "dur": 2.328, "args": { "External id": 17762,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778919.402, "dur": 1.063, "args": { "External id": 17763,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 354 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778926.208, "dur": 9.612, "args": { "External id": 17764,"Record function id": 0, "Sequence number": 246731, "Fwd thread id": 1, "Ev Idx": 355 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778927.145, "dur": 6.262, "args": { "External id": 17765,"Sequence number": 246731, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 356 } }, { "ph": "f", "id": 37, "pid": 1336759, "tid": 1381173, "ts": 1295650778927.145, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778928.151, "dur": 5.034, "args": { "External id": 17766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778928.883, "dur": 3.782, "args": { "External id": 17767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778932.032, "dur": 0.457, "args": { "External id": 17768,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 359 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778940.603, "dur": 5.522, "args": { "External id": 17769,"Record function id": 0, "Ev Idx": 360 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650778942.269, "dur": 3.356, "args": { "External id": 17770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778943.599, "dur": 1.763, "args": { "External id": 17771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 362 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650778944.293, "dur": 0.974, "args": { "External id": 17772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778949.654, "dur": 5.308, "args": { "External id": 17773,"Record function id": 0, "Sequence number": 246730, "Fwd thread id": 1, "Ev Idx": 364 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778950.993, "dur": 2.538, "args": { "External id": 17774,"Sequence number": 246730, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 365 } }, { "ph": "f", "id": 38, "pid": 1336759, "tid": 1381173, "ts": 1295650778950.993, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650778951.963, "dur": 1.407, "args": { "External id": 17775,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650778952.661, "dur": 0.570, "args": { "External id": 17776,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 367 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778957.967, "dur": 192.091, "args": { "External id": 17777,"Record function id": 0, "Sequence number": 246729, "Fwd thread id": 1, "Ev Idx": 368 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650778958.818, "dur": 182.121, "args": { "External id": 17778,"Sequence number": 246729, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 369 } }, { "ph": "f", "id": 39, "pid": 1336759, "tid": 1381173, "ts": 1295650778958.818, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650778963.213, "dur": 3.327, "args": { "External id": 17779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650778963.887, "dur": 2.222, "args": { "External id": 17780,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650778965.524, "dur": 0.445, "args": { "External id": 17781,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650778967.189, "dur": 83.978, "args": { "External id": 17782,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779053.488, "dur": 7.020, "args": { "External id": 17783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779054.674, "dur": 5.055, "args": { "External id": 17784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779058.786, "dur": 0.804, "args": { "External id": 17785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779061.757, "dur": 5.013, "args": { "External id": 17786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779062.967, "dur": 3.336, "args": { "External id": 17787,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779064.822, "dur": 1.351, "args": { "External id": 17788,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650779067.579, "dur": 72.480, "args": { "External id": 17789,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779158.850, "dur": 34.459, "args": { "External id": 17790,"Record function id": 0, "Sequence number": 246728, "Fwd thread id": 1, "Ev Idx": 381 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779160.349, "dur": 4.612, "args": { "External id": 17791,"Sequence number": 246728, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 382 } }, { "ph": "f", "id": 40, "pid": 1336759, "tid": 1381173, "ts": 1295650779160.349, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779162.065, "dur": 2.756, "args": { "External id": 17792,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779163.341, "dur": 1.328, "args": { "External id": 17793,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650779167.995, "dur": 22.408, "args": { "External id": 17794,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 385 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779199.617, "dur": 8.696, "args": { "External id": 17795,"Record function id": 0, "Sequence number": 246727, "Fwd thread id": 1, "Ev Idx": 386 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779200.621, "dur": 5.679, "args": { "External id": 17796,"Sequence number": 246727, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 387 } }, { "ph": "f", "id": 41, "pid": 1336759, "tid": 1381173, "ts": 1295650779200.621, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779201.583, "dur": 4.496, "args": { "External id": 17797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779202.681, "dur": 2.901, "args": { "External id": 17798,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779204.931, "dur": 0.495, "args": { "External id": 17799,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 390 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779212.706, "dur": 6.084, "args": { "External id": 17800,"Record function id": 0, "Ev Idx": 391 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779214.368, "dur": 3.908, "args": { "External id": 17801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779215.692, "dur": 2.283, "args": { "External id": 17802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 393 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779216.379, "dur": 1.479, "args": { "External id": 17803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 394 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650779223.259, "dur": 435.261, "args": { "External id": 17804,"Record function id": 0, "Sequence number": 246726, "Fwd thread id": 1, "Ev Idx": 395 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650779225.199, "dur": 420.286, "args": { "External id": 17805,"Sequence number": 246726, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 396 } }, { "ph": "f", "id": 42, "pid": 1336759, "tid": 1381173, "ts": 1295650779225.199, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1381173, "ts": 1295650779267.676, "dur": 42.559, "args": { "External id": 17806,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650779269.309, "dur": 40.680, "args": { "External id": 17807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650779272.506, "dur": 9.676, "args": { "External id": 17808,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650779277.073, "dur": 4.217, "args": { "External id": 17809,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650779283.752, "dur": 25.670, "args": { "External id": 17810,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779321.451, "dur": 2.627, "args": { "External id": 17811,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779322.485, "dur": 1.461, "args": { "External id": 17812,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779327.788, "dur": 4.923, "args": { "External id": 17813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779330.662, "dur": 1.950, "args": { "External id": 17814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650779345.470, "dur": 2.337, "args": { "External id": 17815,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650779360.104, "dur": 3.036, "args": { "External id": 17816,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779535.590, "dur": 2.297, "args": { "External id": 17817,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650779542.637, "dur": 34.431, "args": { "External id": 17818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779552.603, "dur": 0.982, "args": { "External id": 17819,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650779582.653, "dur": 28.933, "args": { "External id": 17820,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650779584.763, "dur": 26.619, "args": { "External id": 17821,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779590.828, "dur": 3.611, "args": { "External id": 17822,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650779595.814, "dur": 14.959, "args": { "External id": 17823,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650779616.059, "dur": 2.860, "args": { "External id": 17824,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779617.706, "dur": 1.098, "args": { "External id": 17825,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779625.002, "dur": 3.304, "args": { "External id": 17826,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779626.952, "dur": 1.253, "args": { "External id": 17827,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779633.678, "dur": 3.211, "args": { "External id": 17828,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779635.031, "dur": 1.767, "args": { "External id": 17829,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 420 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779671.416, "dur": 9.043, "args": { "External id": 17830,"Record function id": 0, "Ev Idx": 421 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779673.946, "dur": 5.798, "args": { "External id": 17831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779675.845, "dur": 2.937, "args": { "External id": 17832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 423 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779676.904, "dur": 1.797, "args": { "External id": 17833,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 424 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779684.511, "dur": 9.743, "args": { "External id": 17834,"Record function id": 0, "Sequence number": 246725, "Fwd thread id": 1, "Ev Idx": 425 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779685.871, "dur": 5.905, "args": { "External id": 17835,"Sequence number": 246725, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 426 } }, { "ph": "f", "id": 43, "pid": 1336759, "tid": 1381173, "ts": 1295650779685.871, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779689.577, "dur": 1.996, "args": { "External id": 17836,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779690.459, "dur": 0.960, "args": { "External id": 17837,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 428 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779697.853, "dur": 137.816, "args": { "External id": 17838,"Record function id": 0, "Sequence number": 246724, "Fwd thread id": 1, "Ev Idx": 429 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779698.933, "dur": 133.033, "args": { "External id": 17839,"Sequence number": 246724, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 430 } }, { "ph": "f", "id": 44, "pid": 1336759, "tid": 1381173, "ts": 1295650779698.933, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779701.602, "dur": 7.397, "args": { "External id": 17840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779703.140, "dur": 5.267, "args": { "External id": 17841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779707.471, "dur": 0.743, "args": { "External id": 17842,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650779710.385, "dur": 56.159, "args": { "External id": 17843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779767.564, "dur": 5.606, "args": { "External id": 17844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779768.647, "dur": 3.828, "args": { "External id": 17845,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779770.921, "dur": 1.391, "args": { "External id": 17846,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779774.816, "dur": 4.676, "args": { "External id": 17847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779775.550, "dur": 3.510, "args": { "External id": 17848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779778.650, "dur": 0.305, "args": { "External id": 17849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650779780.162, "dur": 50.951, "args": { "External id": 17850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 441 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779840.682, "dur": 9.184, "args": { "External id": 17851,"Record function id": 0, "Sequence number": 246723, "Fwd thread id": 1, "Ev Idx": 442 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779841.999, "dur": 5.815, "args": { "External id": 17852,"Sequence number": 246723, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 443 } }, { "ph": "f", "id": 45, "pid": 1336759, "tid": 1381173, "ts": 1295650779841.999, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779844.150, "dur": 3.498, "args": { "External id": 17853,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779845.148, "dur": 2.346, "args": { "External id": 17854,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 445 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779853.220, "dur": 9.183, "args": { "External id": 17855,"Record function id": 0, "Sequence number": 246722, "Fwd thread id": 1, "Ev Idx": 446 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779854.287, "dur": 6.236, "args": { "External id": 17856,"Sequence number": 246722, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 447 } }, { "ph": "f", "id": 46, "pid": 1336759, "tid": 1381173, "ts": 1295650779854.287, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650779855.179, "dur": 5.128, "args": { "External id": 17857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650779856.149, "dur": 3.628, "args": { "External id": 17858,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779859.162, "dur": 0.478, "args": { "External id": 17859,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779866.687, "dur": 4.956, "args": { "External id": 17860,"Record function id": 0, "Ev Idx": 451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650779868.660, "dur": 2.480, "args": { "External id": 17861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779869.475, "dur": 1.421, "args": { "External id": 17862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650779869.854, "dur": 0.970, "args": { "External id": 17863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779874.611, "dur": 6.013, "args": { "External id": 17864,"Record function id": 0, "Sequence number": 246721, "Fwd thread id": 1, "Ev Idx": 455 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650779875.524, "dur": 3.402, "args": { "External id": 17865,"Sequence number": 246721, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 456 } }, { "ph": "f", "id": 47, "pid": 1336759, "tid": 1381173, "ts": 1295650779875.524, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650779876.708, "dur": 2.061, "args": { "External id": 17866,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650779877.530, "dur": 1.107, "args": { "External id": 17867,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650779884.814, "dur": 365.630, "args": { "External id": 17868,"Record function id": 0, "Sequence number": 246720, "Fwd thread id": 1, "Ev Idx": 459 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650779886.475, "dur": 328.434, "args": { "External id": 17869,"Sequence number": 246720, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 460 } }, { "ph": "f", "id": 48, "pid": 1336759, "tid": 1381173, "ts": 1295650779886.475, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650779899.454, "dur": 6.655, "args": { "External id": 17870,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779902.526, "dur": 3.009, "args": { "External id": 17871,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650779908.002, "dur": 3.338, "args": { "External id": 17872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779909.537, "dur": 1.605, "args": { "External id": 17873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650779913.120, "dur": 5.358, "args": { "External id": 17874,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650779915.212, "dur": 3.014, "args": { "External id": 17875,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 466 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650779949.447, "dur": 238.300, "args": { "External id": 17876,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650780077.353, "dur": 4.544, "args": { "External id": 17877,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650780084.294, "dur": 3.785, "args": { "External id": 17878,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650780201.925, "dur": 3.975, "args": { "External id": 17879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650780208.700, "dur": 0.742, "args": { "External id": 17880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650780211.476, "dur": 0.695, "args": { "External id": 17881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650780261.976, "dur": 232.391, "args": { "External id": 17882,"Record function id": 0, "Sequence number": 246719, "Fwd thread id": 1, "Ev Idx": 473 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650780264.245, "dur": 223.021, "args": { "External id": 17883,"Sequence number": 246719, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 474 } }, { "ph": "f", "id": 49, "pid": 1336759, "tid": 1381173, "ts": 1295650780264.245, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650780286.388, "dur": 48.030, "args": { "External id": 17884,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780289.831, "dur": 3.756, "args": { "External id": 17885,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650780294.994, "dur": 38.457, "args": { "External id": 17886,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650780344.151, "dur": 4.817, "args": { "External id": 17887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780346.451, "dur": 2.182, "args": { "External id": 17888,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 479 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650780501.571, "dur": 149.372, "args": { "External id": 17889,"Record function id": 0, "Sequence number": 246718, "Fwd thread id": 1, "Ev Idx": 480 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650780503.711, "dur": 141.586, "args": { "External id": 17890,"Sequence number": 246718, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 481 } }, { "ph": "f", "id": 50, "pid": 1336759, "tid": 1381173, "ts": 1295650780503.711, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650780516.061, "dur": 29.737, "args": { "External id": 17891,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780519.074, "dur": 2.461, "args": { "External id": 17892,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650780522.501, "dur": 22.752, "args": { "External id": 17893,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650780552.911, "dur": 4.168, "args": { "External id": 17894,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780554.623, "dur": 2.186, "args": { "External id": 17895,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780658.118, "dur": 14.422, "args": { "External id": 17896,"Record function id": 0, "Sequence number": 246717, "Fwd thread id": 1, "Ev Idx": 487 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780659.454, "dur": 10.314, "args": { "External id": 17897,"Sequence number": 246717, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 488 } }, { "ph": "f", "id": 51, "pid": 1336759, "tid": 1381173, "ts": 1295650780659.454, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780662.081, "dur": 7.419, "args": { "External id": 17898,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780664.163, "dur": 5.123, "args": { "External id": 17899,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 490 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780676.231, "dur": 8.559, "args": { "External id": 17900,"Record function id": 0, "Sequence number": 246716, "Fwd thread id": 1, "Ev Idx": 491 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780677.126, "dur": 6.018, "args": { "External id": 17901,"Sequence number": 246716, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 492 } }, { "ph": "f", "id": 52, "pid": 1336759, "tid": 1381173, "ts": 1295650780677.126, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780678.717, "dur": 4.289, "args": { "External id": 17902,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780682.116, "dur": 0.750, "args": { "External id": 17903,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 494 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780687.694, "dur": 5.972, "args": { "External id": 17904,"Record function id": 0, "Sequence number": 246715, "Fwd thread id": 1, "Ev Idx": 495 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780688.634, "dur": 3.247, "args": { "External id": 17905,"Sequence number": 246715, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 496 } }, { "ph": "f", "id": 53, "pid": 1336759, "tid": 1381173, "ts": 1295650780688.634, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780690.108, "dur": 1.632, "args": { "External id": 17906,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780690.921, "dur": 0.692, "args": { "External id": 17907,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 498 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780697.128, "dur": 6.181, "args": { "External id": 17908,"Record function id": 0, "Sequence number": 246714, "Fwd thread id": 1, "Ev Idx": 499 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780698.760, "dur": 2.984, "args": { "External id": 17909,"Sequence number": 246714, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 500 } }, { "ph": "f", "id": 54, "pid": 1336759, "tid": 1381173, "ts": 1295650780698.760, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780699.601, "dur": 1.991, "args": { "External id": 17910,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780700.609, "dur": 0.885, "args": { "External id": 17911,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 502 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780706.814, "dur": 173.567, "args": { "External id": 17912,"Record function id": 0, "Sequence number": 246713, "Fwd thread id": 1, "Ev Idx": 503 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780710.017, "dur": 164.447, "args": { "External id": 17913,"Sequence number": 246713, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 504 } }, { "ph": "f", "id": 55, "pid": 1336759, "tid": 1381173, "ts": 1295650780710.017, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780714.965, "dur": 7.438, "args": { "External id": 17914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780717.232, "dur": 4.477, "args": { "External id": 17915,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780719.690, "dur": 1.755, "args": { "External id": 17916,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650780723.865, "dur": 65.229, "args": { "External id": 17917,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780790.312, "dur": 7.077, "args": { "External id": 17918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780791.397, "dur": 5.146, "args": { "External id": 17919,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780795.396, "dur": 1.017, "args": { "External id": 17920,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780822.345, "dur": 3.546, "args": { "External id": 17921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780823.380, "dur": 2.033, "args": { "External id": 17922,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780824.984, "dur": 0.365, "args": { "External id": 17923,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650780826.635, "dur": 46.861, "args": { "External id": 17924,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780885.493, "dur": 8.714, "args": { "External id": 17925,"Record function id": 0, "Sequence number": 246712, "Fwd thread id": 1, "Ev Idx": 516 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780886.376, "dur": 6.115, "args": { "External id": 17926,"Sequence number": 246712, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 517 } }, { "ph": "f", "id": 56, "pid": 1336759, "tid": 1381173, "ts": 1295650780886.376, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780888.014, "dur": 4.336, "args": { "External id": 17927,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780891.000, "dur": 1.249, "args": { "External id": 17928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 519 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780897.528, "dur": 7.319, "args": { "External id": 17929,"Record function id": 0, "Sequence number": 246711, "Fwd thread id": 1, "Ev Idx": 520 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780898.314, "dur": 4.417, "args": { "External id": 17930,"Sequence number": 246711, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 521 } }, { "ph": "f", "id": 57, "pid": 1336759, "tid": 1381173, "ts": 1295650780898.314, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780898.947, "dur": 3.579, "args": { "External id": 17931,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780899.580, "dur": 2.433, "args": { "External id": 17932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780901.440, "dur": 0.466, "args": { "External id": 17933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 524 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650780910.866, "dur": 11.235, "args": { "External id": 17934,"Record function id": 0, "Ev Idx": 525 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650780912.935, "dur": 8.332, "args": { "External id": 17935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650780915.376, "dur": 5.560, "args": { "External id": 17936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 527 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650780918.437, "dur": 2.341, "args": { "External id": 17937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 528 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780927.316, "dur": 5.866, "args": { "External id": 17938,"Record function id": 0, "Sequence number": 246710, "Fwd thread id": 1, "Ev Idx": 529 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780928.620, "dur": 2.835, "args": { "External id": 17939,"Sequence number": 246710, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 530 } }, { "ph": "f", "id": 58, "pid": 1336759, "tid": 1381173, "ts": 1295650780928.620, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650780929.558, "dur": 1.765, "args": { "External id": 17940,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650780930.421, "dur": 0.804, "args": { "External id": 17941,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 532 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780936.342, "dur": 137.930, "args": { "External id": 17942,"Record function id": 0, "Sequence number": 246709, "Fwd thread id": 1, "Ev Idx": 533 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650780937.122, "dur": 129.703, "args": { "External id": 17943,"Sequence number": 246709, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 534 } }, { "ph": "f", "id": 59, "pid": 1336759, "tid": 1381173, "ts": 1295650780937.122, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780939.171, "dur": 4.060, "args": { "External id": 17944,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780939.597, "dur": 3.181, "args": { "External id": 17945,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780942.306, "dur": 0.370, "args": { "External id": 17946,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650780943.844, "dur": 27.252, "args": { "External id": 17947,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780972.215, "dur": 3.657, "args": { "External id": 17948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780972.746, "dur": 2.570, "args": { "External id": 17949,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780974.505, "dur": 0.697, "args": { "External id": 17950,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650780976.895, "dur": 6.900, "args": { "External id": 17951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650780979.683, "dur": 3.646, "args": { "External id": 17952,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650780981.406, "dur": 1.851, "args": { "External id": 17953,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650781025.832, "dur": 39.797, "args": { "External id": 17954,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 545 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781080.718, "dur": 32.657, "args": { "External id": 17955,"Record function id": 0, "Sequence number": 246708, "Fwd thread id": 1, "Ev Idx": 546 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781081.645, "dur": 3.937, "args": { "External id": 17956,"Sequence number": 246708, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 547 } }, { "ph": "f", "id": 60, "pid": 1336759, "tid": 1381173, "ts": 1295650781081.645, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781083.319, "dur": 2.124, "args": { "External id": 17957,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781084.057, "dur": 1.290, "args": { "External id": 17958,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650781088.861, "dur": 21.998, "args": { "External id": 17959,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 550 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781117.085, "dur": 10.625, "args": { "External id": 17960,"Record function id": 0, "Sequence number": 246707, "Fwd thread id": 1, "Ev Idx": 551 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781118.009, "dur": 7.869, "args": { "External id": 17961,"Sequence number": 246707, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 552 } }, { "ph": "f", "id": 61, "pid": 1336759, "tid": 1381173, "ts": 1295650781118.009, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781121.491, "dur": 4.207, "args": { "External id": 17962,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781122.307, "dur": 2.730, "args": { "External id": 17963,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781124.345, "dur": 0.602, "args": { "External id": 17964,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 555 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781131.982, "dur": 6.288, "args": { "External id": 17965,"Record function id": 0, "Ev Idx": 556 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781133.781, "dur": 3.899, "args": { "External id": 17966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781135.147, "dur": 2.221, "args": { "External id": 17967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 558 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781135.695, "dur": 1.561, "args": { "External id": 17968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 559 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781141.606, "dur": 9.309, "args": { "External id": 17969,"Record function id": 0, "Sequence number": 246706, "Fwd thread id": 1, "Ev Idx": 560 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781143.402, "dur": 5.481, "args": { "External id": 17970,"Sequence number": 246706, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 561 } }, { "ph": "f", "id": 62, "pid": 1336759, "tid": 1381173, "ts": 1295650781143.402, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781144.558, "dur": 4.191, "args": { "External id": 17971,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781147.740, "dur": 0.909, "args": { "External id": 17972,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 563 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781154.038, "dur": 106.274, "args": { "External id": 17973,"Record function id": 0, "Sequence number": 246705, "Fwd thread id": 1, "Ev Idx": 564 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781154.666, "dur": 96.970, "args": { "External id": 17974,"Sequence number": 246705, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 565 } }, { "ph": "f", "id": 63, "pid": 1336759, "tid": 1381173, "ts": 1295650781154.666, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781156.603, "dur": 3.229, "args": { "External id": 17975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781157.025, "dur": 2.332, "args": { "External id": 17976,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781158.769, "dur": 0.472, "args": { "External id": 17977,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650781160.455, "dur": 28.345, "args": { "External id": 17978,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781192.075, "dur": 3.142, "args": { "External id": 17979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781192.560, "dur": 2.097, "args": { "External id": 17980,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781194.024, "dur": 0.531, "args": { "External id": 17981,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781196.230, "dur": 3.273, "args": { "External id": 17982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781197.468, "dur": 1.606, "args": { "External id": 17983,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781198.790, "dur": 0.196, "args": { "External id": 17984,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650781201.726, "dur": 48.562, "args": { "External id": 17985,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781267.172, "dur": 27.023, "args": { "External id": 17986,"Record function id": 0, "Sequence number": 246704, "Fwd thread id": 1, "Ev Idx": 577 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781268.174, "dur": 4.618, "args": { "External id": 17987,"Sequence number": 246704, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 578 } }, { "ph": "f", "id": 64, "pid": 1336759, "tid": 1381173, "ts": 1295650781268.174, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781269.980, "dur": 2.642, "args": { "External id": 17988,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781270.939, "dur": 1.551, "args": { "External id": 17989,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650781275.333, "dur": 17.088, "args": { "External id": 17990,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 581 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781297.687, "dur": 12.056, "args": { "External id": 17991,"Record function id": 0, "Sequence number": 246703, "Fwd thread id": 1, "Ev Idx": 582 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781298.601, "dur": 9.447, "args": { "External id": 17992,"Sequence number": 246703, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 583 } }, { "ph": "f", "id": 65, "pid": 1336759, "tid": 1381173, "ts": 1295650781298.601, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781299.411, "dur": 8.428, "args": { "External id": 17993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781303.260, "dur": 4.021, "args": { "External id": 17994,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781306.618, "dur": 0.572, "args": { "External id": 17995,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 586 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781313.891, "dur": 5.428, "args": { "External id": 17996,"Record function id": 0, "Ev Idx": 587 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781315.543, "dur": 3.292, "args": { "External id": 17997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781316.870, "dur": 1.667, "args": { "External id": 17998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 589 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781317.248, "dur": 1.209, "args": { "External id": 17999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 590 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650781323.735, "dur": 353.984, "args": { "External id": 18000,"Record function id": 0, "Sequence number": 246702, "Fwd thread id": 1, "Ev Idx": 591 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650781325.449, "dur": 323.103, "args": { "External id": 18001,"Sequence number": 246702, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 592 } }, { "ph": "f", "id": 66, "pid": 1336759, "tid": 1381173, "ts": 1295650781325.449, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781360.974, "dur": 2.261, "args": { "External id": 18002,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781361.922, "dur": 1.156, "args": { "External id": 18003,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650781379.314, "dur": 5.658, "args": { "External id": 18004,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650781394.813, "dur": 1.842, "args": { "External id": 18005,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781550.403, "dur": 1.656, "args": { "External id": 18006,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650781556.142, "dur": 33.762, "args": { "External id": 18007,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781566.217, "dur": 1.086, "args": { "External id": 18008,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650781595.637, "dur": 29.546, "args": { "External id": 18009,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650781597.434, "dur": 27.515, "args": { "External id": 18010,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781601.823, "dur": 5.327, "args": { "External id": 18011,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650781608.908, "dur": 15.371, "args": { "External id": 18012,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650781631.596, "dur": 2.289, "args": { "External id": 18013,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781632.714, "dur": 1.031, "args": { "External id": 18014,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781639.997, "dur": 2.172, "args": { "External id": 18015,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781641.096, "dur": 0.983, "args": { "External id": 18016,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650781657.475, "dur": 14.901, "args": { "External id": 18017,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 608 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781686.022, "dur": 9.693, "args": { "External id": 18018,"Record function id": 0, "Ev Idx": 609 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650781688.348, "dur": 6.684, "args": { "External id": 18019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781689.615, "dur": 4.494, "args": { "External id": 18020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 611 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650781692.707, "dur": 1.289, "args": { "External id": 18021,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 612 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781701.512, "dur": 5.326, "args": { "External id": 18022,"Record function id": 0, "Sequence number": 246701, "Fwd thread id": 1, "Ev Idx": 613 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650781702.515, "dur": 1.040, "args": { "External id": 18023,"Sequence number": 246701, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 614 } }, { "ph": "f", "id": 67, "pid": 1336759, "tid": 1381173, "ts": 1295650781702.515, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650781711.341, "dur": 432.049, "args": { "External id": 18024,"Record function id": 0, "Sequence number": 246700, "Fwd thread id": 1, "Ev Idx": 615 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650781712.912, "dur": 419.812, "args": { "External id": 18025,"Sequence number": 246700, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 616 } }, { "ph": "f", "id": 68, "pid": 1336759, "tid": 1381173, "ts": 1295650781712.912, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781741.545, "dur": 9.097, "args": { "External id": 18026,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650781747.350, "dur": 2.985, "args": { "External id": 18027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781753.498, "dur": 5.984, "args": { "External id": 18028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781754.756, "dur": 4.120, "args": { "External id": 18029,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781757.976, "dur": 0.744, "args": { "External id": 18030,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1381173, "ts": 1295650781763.062, "dur": 82.269, "args": { "External id": 18031,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650781764.151, "dur": 4.111, "args": { "External id": 18032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650781764.593, "dur": 3.233, "args": { "External id": 18033,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781766.136, "dur": 1.605, "args": { "External id": 18034,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1381173, "ts": 1295650781769.404, "dur": 75.419, "args": { "External id": 18035,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650781772.972, "dur": 71.016, "args": { "External id": 18036,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650781848.665, "dur": 2.578, "args": { "External id": 18037,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781849.813, "dur": 1.288, "args": { "External id": 18038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650781882.232, "dur": 4.009, "args": { "External id": 18039,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650781887.608, "dur": 1.441, "args": { "External id": 18040,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650781890.083, "dur": 1.511, "args": { "External id": 18041,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781923.532, "dur": 2.537, "args": { "External id": 18042,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650781924.533, "dur": 1.376, "args": { "External id": 18043,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336759, "tid": 1381173, "ts": 1295650781945.609, "dur": 168.310, "args": { "External id": 18044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650781950.726, "dur": 5.223, "args": { "External id": 18045,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781954.500, "dur": 0.759, "args": { "External id": 18046,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650781958.098, "dur": 6.564, "args": { "External id": 18047,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781962.419, "dur": 1.577, "args": { "External id": 18048,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650781965.983, "dur": 2.326, "args": { "External id": 18049,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781967.645, "dur": 0.306, "args": { "External id": 18050,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650781969.446, "dur": 3.099, "args": { "External id": 18051,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781971.661, "dur": 0.447, "args": { "External id": 18052,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650781977.919, "dur": 2.618, "args": { "External id": 18053,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650781979.814, "dur": 0.401, "args": { "External id": 18054,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650781981.887, "dur": 49.178, "args": { "External id": 18055,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650782027.962, "dur": 2.690, "args": { "External id": 18056,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650782032.360, "dur": 2.840, "args": { "External id": 18057,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782034.505, "dur": 0.339, "args": { "External id": 18058,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782036.391, "dur": 3.462, "args": { "External id": 18059,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782037.471, "dur": 2.245, "args": { "External id": 18060,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650782041.305, "dur": 57.803, "args": { "External id": 18061,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782102.868, "dur": 2.023, "args": { "External id": 18062,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650782105.931, "dur": 3.249, "args": { "External id": 18063,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782108.224, "dur": 0.432, "args": { "External id": 18064,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782111.761, "dur": 0.994, "args": { "External id": 18065,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 656 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782155.298, "dur": 9.751, "args": { "External id": 18066,"Record function id": 0, "Ev Idx": 657 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782157.843, "dur": 6.467, "args": { "External id": 18067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782160.113, "dur": 3.122, "args": { "External id": 18068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 659 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782161.189, "dur": 1.919, "args": { "External id": 18069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 660 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782168.863, "dur": 9.155, "args": { "External id": 18070,"Record function id": 0, "Sequence number": 246699, "Fwd thread id": 1, "Ev Idx": 661 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782170.237, "dur": 6.012, "args": { "External id": 18071,"Sequence number": 246699, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 662 } }, { "ph": "f", "id": 69, "pid": 1336759, "tid": 1381173, "ts": 1295650782170.237, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782171.699, "dur": 4.322, "args": { "External id": 18072,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782175.113, "dur": 0.775, "args": { "External id": 18073,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782181.638, "dur": 142.229, "args": { "External id": 18074,"Record function id": 0, "Sequence number": 246698, "Fwd thread id": 1, "Ev Idx": 665 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782182.609, "dur": 133.606, "args": { "External id": 18075,"Sequence number": 246698, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 666 } }, { "ph": "f", "id": 70, "pid": 1336759, "tid": 1381173, "ts": 1295650782182.609, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782185.870, "dur": 3.921, "args": { "External id": 18076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782187.046, "dur": 2.177, "args": { "External id": 18077,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782188.674, "dur": 0.394, "args": { "External id": 18078,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650782190.794, "dur": 55.582, "args": { "External id": 18079,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782250.738, "dur": 5.003, "args": { "External id": 18080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782251.509, "dur": 3.223, "args": { "External id": 18081,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782253.492, "dur": 1.048, "args": { "External id": 18082,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782257.300, "dur": 3.249, "args": { "External id": 18083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782258.017, "dur": 1.864, "args": { "External id": 18084,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782259.549, "dur": 0.232, "args": { "External id": 18085,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650782263.073, "dur": 52.152, "args": { "External id": 18086,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 677 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782329.865, "dur": 7.214, "args": { "External id": 18087,"Record function id": 0, "Sequence number": 246697, "Fwd thread id": 1, "Ev Idx": 678 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782330.789, "dur": 4.799, "args": { "External id": 18088,"Sequence number": 246697, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 679 } }, { "ph": "f", "id": 71, "pid": 1336759, "tid": 1381173, "ts": 1295650782330.789, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782332.606, "dur": 2.833, "args": { "External id": 18089,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782333.830, "dur": 1.472, "args": { "External id": 18090,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 681 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782340.285, "dur": 7.117, "args": { "External id": 18091,"Record function id": 0, "Sequence number": 246696, "Fwd thread id": 1, "Ev Idx": 682 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782341.043, "dur": 4.026, "args": { "External id": 18092,"Sequence number": 246696, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 683 } }, { "ph": "f", "id": 72, "pid": 1336759, "tid": 1381173, "ts": 1295650782341.043, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782341.643, "dur": 3.202, "args": { "External id": 18093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782342.292, "dur": 2.041, "args": { "External id": 18094,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782343.876, "dur": 0.324, "args": { "External id": 18095,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782351.782, "dur": 7.484, "args": { "External id": 18096,"Record function id": 0, "Ev Idx": 687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782353.342, "dur": 5.445, "args": { "External id": 18097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782354.556, "dur": 3.968, "args": { "External id": 18098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782357.322, "dur": 1.079, "args": { "External id": 18099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782362.500, "dur": 6.194, "args": { "External id": 18100,"Record function id": 0, "Sequence number": 246695, "Fwd thread id": 1, "Ev Idx": 691 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782363.959, "dur": 2.666, "args": { "External id": 18101,"Sequence number": 246695, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 692 } }, { "ph": "f", "id": 73, "pid": 1336759, "tid": 1381173, "ts": 1295650782363.959, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782365.024, "dur": 1.473, "args": { "External id": 18102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782365.744, "dur": 0.620, "args": { "External id": 18103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782371.680, "dur": 111.235, "args": { "External id": 18104,"Record function id": 0, "Sequence number": 246694, "Fwd thread id": 1, "Ev Idx": 695 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782372.357, "dur": 103.441, "args": { "External id": 18105,"Sequence number": 246694, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 696 } }, { "ph": "f", "id": 74, "pid": 1336759, "tid": 1381173, "ts": 1295650782372.357, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782374.419, "dur": 8.576, "args": { "External id": 18106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782377.275, "dur": 5.279, "args": { "External id": 18107,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782382.060, "dur": 0.356, "args": { "External id": 18108,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650782383.590, "dur": 34.770, "args": { "External id": 18109,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782419.461, "dur": 4.450, "args": { "External id": 18110,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782419.922, "dur": 3.347, "args": { "External id": 18111,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782421.705, "dur": 1.429, "args": { "External id": 18112,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782426.906, "dur": 3.725, "args": { "External id": 18113,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782427.349, "dur": 2.794, "args": { "External id": 18114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782428.706, "dur": 1.354, "args": { "External id": 18115,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650782431.071, "dur": 44.021, "args": { "External id": 18116,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782487.081, "dur": 29.130, "args": { "External id": 18117,"Record function id": 0, "Sequence number": 246693, "Fwd thread id": 1, "Ev Idx": 708 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782487.908, "dur": 3.904, "args": { "External id": 18118,"Sequence number": 246693, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 709 } }, { "ph": "f", "id": 75, "pid": 1336759, "tid": 1381173, "ts": 1295650782487.908, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782489.366, "dur": 2.297, "args": { "External id": 18119,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782490.339, "dur": 1.193, "args": { "External id": 18120,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650782494.266, "dur": 19.407, "args": { "External id": 18121,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 712 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782519.936, "dur": 8.794, "args": { "External id": 18122,"Record function id": 0, "Sequence number": 246692, "Fwd thread id": 1, "Ev Idx": 713 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782522.729, "dur": 4.419, "args": { "External id": 18123,"Sequence number": 246692, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 714 } }, { "ph": "f", "id": 76, "pid": 1336759, "tid": 1381173, "ts": 1295650782522.729, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782523.499, "dur": 3.411, "args": { "External id": 18124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782524.194, "dur": 2.191, "args": { "External id": 18125,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782525.915, "dur": 0.352, "args": { "External id": 18126,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782532.722, "dur": 4.732, "args": { "External id": 18127,"Record function id": 0, "Ev Idx": 718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782534.114, "dur": 2.743, "args": { "External id": 18128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782535.008, "dur": 1.595, "args": { "External id": 18129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782535.574, "dur": 0.918, "args": { "External id": 18130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650782543.632, "dur": 383.781, "args": { "External id": 18131,"Record function id": 0, "Sequence number": 246691, "Fwd thread id": 1, "Ev Idx": 722 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650782545.159, "dur": 353.722, "args": { "External id": 18132,"Sequence number": 246691, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 723 } }, { "ph": "f", "id": 77, "pid": 1336759, "tid": 1381173, "ts": 1295650782545.159, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1381173, "ts": 1295650782568.815, "dur": 32.079, "args": { "External id": 18133,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650782570.413, "dur": 30.219, "args": { "External id": 18134,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650782573.528, "dur": 6.059, "args": { "External id": 18135,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650782575.976, "dur": 3.077, "args": { "External id": 18136,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650782580.873, "dur": 19.377, "args": { "External id": 18137,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782612.745, "dur": 2.198, "args": { "External id": 18138,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782613.740, "dur": 1.074, "args": { "External id": 18139,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782618.752, "dur": 2.624, "args": { "External id": 18140,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782619.383, "dur": 1.894, "args": { "External id": 18141,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650782634.435, "dur": 2.390, "args": { "External id": 18142,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650782647.534, "dur": 1.809, "args": { "External id": 18143,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782799.408, "dur": 2.238, "args": { "External id": 18144,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650782805.717, "dur": 29.360, "args": { "External id": 18145,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782814.098, "dur": 0.693, "args": { "External id": 18146,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650782840.434, "dur": 29.214, "args": { "External id": 18147,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650782842.268, "dur": 27.097, "args": { "External id": 18148,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782846.585, "dur": 3.613, "args": { "External id": 18149,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650782854.069, "dur": 14.829, "args": { "External id": 18150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650782873.800, "dur": 2.375, "args": { "External id": 18151,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782875.022, "dur": 1.021, "args": { "External id": 18152,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782882.089, "dur": 2.093, "args": { "External id": 18153,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782883.069, "dur": 1.000, "args": { "External id": 18154,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782886.353, "dur": 2.621, "args": { "External id": 18155,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782887.194, "dur": 1.689, "args": { "External id": 18156,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650782910.161, "dur": 15.650, "args": { "External id": 18157,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782937.014, "dur": 7.055, "args": { "External id": 18158,"Record function id": 0, "Ev Idx": 749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650782939.282, "dur": 4.089, "args": { "External id": 18159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782940.891, "dur": 1.699, "args": { "External id": 18160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650782941.500, "dur": 0.984, "args": { "External id": 18161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782948.094, "dur": 7.724, "args": { "External id": 18162,"Record function id": 0, "Sequence number": 246690, "Fwd thread id": 1, "Ev Idx": 753 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782949.533, "dur": 4.003, "args": { "External id": 18163,"Sequence number": 246690, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 754 } }, { "ph": "f", "id": 78, "pid": 1336759, "tid": 1381173, "ts": 1295650782949.533, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650782951.267, "dur": 2.083, "args": { "External id": 18164,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650782952.108, "dur": 1.127, "args": { "External id": 18165,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782960.879, "dur": 167.655, "args": { "External id": 18166,"Record function id": 0, "Sequence number": 246689, "Fwd thread id": 1, "Ev Idx": 757 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650782961.809, "dur": 159.990, "args": { "External id": 18167,"Sequence number": 246689, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 758 } }, { "ph": "f", "id": 79, "pid": 1336759, "tid": 1381173, "ts": 1295650782961.809, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650782964.097, "dur": 4.636, "args": { "External id": 18168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650782965.104, "dur": 3.078, "args": { "External id": 18169,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650782967.291, "dur": 0.763, "args": { "External id": 18170,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650782969.711, "dur": 94.532, "args": { "External id": 18171,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650783066.781, "dur": 7.709, "args": { "External id": 18172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650783069.635, "dur": 3.927, "args": { "External id": 18173,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783071.881, "dur": 1.441, "args": { "External id": 18174,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650783076.044, "dur": 3.166, "args": { "External id": 18175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650783076.904, "dur": 1.826, "args": { "External id": 18176,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783078.270, "dur": 0.373, "args": { "External id": 18177,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650783079.815, "dur": 40.844, "args": { "External id": 18178,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 769 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783134.874, "dur": 10.099, "args": { "External id": 18179,"Record function id": 0, "Sequence number": 246688, "Fwd thread id": 1, "Ev Idx": 770 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783138.249, "dur": 5.204, "args": { "External id": 18180,"Sequence number": 246688, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 771 } }, { "ph": "f", "id": 80, "pid": 1336759, "tid": 1381173, "ts": 1295650783138.249, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783139.898, "dur": 3.402, "args": { "External id": 18181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783140.807, "dur": 2.347, "args": { "External id": 18182,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 773 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783148.058, "dur": 6.772, "args": { "External id": 18183,"Record function id": 0, "Sequence number": 246687, "Fwd thread id": 1, "Ev Idx": 774 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783148.879, "dur": 4.123, "args": { "External id": 18184,"Sequence number": 246687, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 775 } }, { "ph": "f", "id": 81, "pid": 1336759, "tid": 1381173, "ts": 1295650783148.879, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650783149.646, "dur": 3.181, "args": { "External id": 18185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650783150.196, "dur": 2.138, "args": { "External id": 18186,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783151.922, "dur": 0.290, "args": { "External id": 18187,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 778 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650783159.316, "dur": 8.620, "args": { "External id": 18188,"Record function id": 0, "Ev Idx": 779 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650783161.086, "dur": 6.320, "args": { "External id": 18189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650783162.592, "dur": 4.526, "args": { "External id": 18190,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 781 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650783165.852, "dur": 1.144, "args": { "External id": 18191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 782 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783170.994, "dur": 6.059, "args": { "External id": 18192,"Record function id": 0, "Sequence number": 246686, "Fwd thread id": 1, "Ev Idx": 783 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783171.796, "dur": 3.400, "args": { "External id": 18193,"Sequence number": 246686, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 784 } }, { "ph": "f", "id": 82, "pid": 1336759, "tid": 1381173, "ts": 1295650783171.796, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783172.985, "dur": 2.053, "args": { "External id": 18194,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783173.776, "dur": 1.129, "args": { "External id": 18195,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 786 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783181.291, "dur": 301.480, "args": { "External id": 18196,"Record function id": 0, "Sequence number": 246685, "Fwd thread id": 1, "Ev Idx": 787 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783183.156, "dur": 282.095, "args": { "External id": 18197,"Sequence number": 246685, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 788 } }, { "ph": "f", "id": 83, "pid": 1336759, "tid": 1381173, "ts": 1295650783183.156, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650783197.319, "dur": 7.291, "args": { "External id": 18198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783200.550, "dur": 3.515, "args": { "External id": 18199,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650783206.606, "dur": 3.361, "args": { "External id": 18200,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783208.143, "dur": 1.613, "args": { "External id": 18201,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650783211.830, "dur": 5.233, "args": { "External id": 18202,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783214.153, "dur": 2.708, "args": { "External id": 18203,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 794 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650783264.964, "dur": 174.086, "args": { "External id": 18204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650783345.882, "dur": 4.075, "args": { "External id": 18205,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650783351.950, "dur": 3.390, "args": { "External id": 18206,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650783452.384, "dur": 3.951, "args": { "External id": 18207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650783459.362, "dur": 0.674, "args": { "External id": 18208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650783462.077, "dur": 0.516, "args": { "External id": 18209,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 800 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783492.269, "dur": 216.967, "args": { "External id": 18210,"Record function id": 0, "Sequence number": 246684, "Fwd thread id": 1, "Ev Idx": 801 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783494.145, "dur": 209.113, "args": { "External id": 18211,"Sequence number": 246684, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 802 } }, { "ph": "f", "id": 84, "pid": 1336759, "tid": 1381173, "ts": 1295650783494.145, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650783512.866, "dur": 44.039, "args": { "External id": 18212,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783516.067, "dur": 2.906, "args": { "External id": 18213,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650783520.403, "dur": 35.735, "args": { "External id": 18214,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650783565.995, "dur": 4.254, "args": { "External id": 18215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783567.794, "dur": 2.194, "args": { "External id": 18216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783715.788, "dur": 140.410, "args": { "External id": 18217,"Record function id": 0, "Sequence number": 246683, "Fwd thread id": 1, "Ev Idx": 808 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650783717.901, "dur": 133.288, "args": { "External id": 18218,"Sequence number": 246683, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 809 } }, { "ph": "f", "id": 85, "pid": 1336759, "tid": 1381173, "ts": 1295650783717.901, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650783729.837, "dur": 30.064, "args": { "External id": 18219,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783732.110, "dur": 2.351, "args": { "External id": 18220,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650783735.498, "dur": 23.863, "args": { "External id": 18221,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650783766.754, "dur": 3.840, "args": { "External id": 18222,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783768.612, "dur": 1.697, "args": { "External id": 18223,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 814 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783861.922, "dur": 14.351, "args": { "External id": 18224,"Record function id": 0, "Sequence number": 246682, "Fwd thread id": 1, "Ev Idx": 815 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783865.239, "dur": 8.798, "args": { "External id": 18225,"Sequence number": 246682, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 816 } }, { "ph": "f", "id": 86, "pid": 1336759, "tid": 1381173, "ts": 1295650783865.239, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783867.710, "dur": 6.082, "args": { "External id": 18226,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783869.358, "dur": 4.250, "args": { "External id": 18227,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 818 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783879.900, "dur": 6.211, "args": { "External id": 18228,"Record function id": 0, "Sequence number": 246681, "Fwd thread id": 1, "Ev Idx": 819 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783880.710, "dur": 3.526, "args": { "External id": 18229,"Sequence number": 246681, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 820 } }, { "ph": "f", "id": 87, "pid": 1336759, "tid": 1381173, "ts": 1295650783880.710, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783882.148, "dur": 1.950, "args": { "External id": 18230,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783883.318, "dur": 0.687, "args": { "External id": 18231,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 822 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783891.358, "dur": 7.598, "args": { "External id": 18232,"Record function id": 0, "Sequence number": 246680, "Fwd thread id": 1, "Ev Idx": 823 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783892.135, "dur": 5.143, "args": { "External id": 18233,"Sequence number": 246680, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 824 } }, { "ph": "f", "id": 88, "pid": 1336759, "tid": 1381173, "ts": 1295650783892.135, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783893.341, "dur": 3.795, "args": { "External id": 18234,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783896.391, "dur": 0.605, "args": { "External id": 18235,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 826 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783902.540, "dur": 6.170, "args": { "External id": 18236,"Record function id": 0, "Sequence number": 246679, "Fwd thread id": 1, "Ev Idx": 827 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783903.822, "dur": 2.839, "args": { "External id": 18237,"Sequence number": 246679, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 828 } }, { "ph": "f", "id": 89, "pid": 1336759, "tid": 1381173, "ts": 1295650783903.822, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650783904.708, "dur": 1.814, "args": { "External id": 18238,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650783905.784, "dur": 0.619, "args": { "External id": 18239,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 830 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783912.037, "dur": 187.742, "args": { "External id": 18240,"Record function id": 0, "Sequence number": 246678, "Fwd thread id": 1, "Ev Idx": 831 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650783912.723, "dur": 178.210, "args": { "External id": 18241,"Sequence number": 246678, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 832 } }, { "ph": "f", "id": 90, "pid": 1336759, "tid": 1381173, "ts": 1295650783912.723, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650783915.554, "dur": 7.975, "args": { "External id": 18242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650783917.126, "dur": 5.849, "args": { "External id": 18243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650783921.234, "dur": 1.484, "args": { "External id": 18244,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650783924.935, "dur": 58.792, "args": { "External id": 18245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784025.234, "dur": 6.289, "args": { "External id": 18246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784026.350, "dur": 4.198, "args": { "External id": 18247,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784028.778, "dur": 1.434, "args": { "External id": 18248,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784033.573, "dur": 4.952, "args": { "External id": 18249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784034.413, "dur": 3.467, "args": { "External id": 18250,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784037.381, "dur": 0.388, "args": { "External id": 18251,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784039.491, "dur": 50.404, "args": { "External id": 18252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784107.365, "dur": 7.901, "args": { "External id": 18253,"Record function id": 0, "Sequence number": 246677, "Fwd thread id": 1, "Ev Idx": 844 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784108.452, "dur": 4.847, "args": { "External id": 18254,"Sequence number": 246677, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 845 } }, { "ph": "f", "id": 91, "pid": 1336759, "tid": 1381173, "ts": 1295650784108.452, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784110.572, "dur": 2.600, "args": { "External id": 18255,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784111.652, "dur": 1.420, "args": { "External id": 18256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784118.520, "dur": 8.793, "args": { "External id": 18257,"Record function id": 0, "Sequence number": 246676, "Fwd thread id": 1, "Ev Idx": 848 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784119.356, "dur": 6.382, "args": { "External id": 18258,"Sequence number": 246676, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 849 } }, { "ph": "f", "id": 92, "pid": 1336759, "tid": 1381173, "ts": 1295650784119.356, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784120.049, "dur": 5.502, "args": { "External id": 18259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784122.740, "dur": 2.333, "args": { "External id": 18260,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784124.493, "dur": 0.426, "args": { "External id": 18261,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 852 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784133.563, "dur": 9.633, "args": { "External id": 18262,"Record function id": 0, "Ev Idx": 853 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784135.604, "dur": 6.901, "args": { "External id": 18263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784138.246, "dur": 3.909, "args": { "External id": 18264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 855 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784139.536, "dur": 2.495, "args": { "External id": 18265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784146.468, "dur": 6.325, "args": { "External id": 18266,"Record function id": 0, "Sequence number": 246675, "Fwd thread id": 1, "Ev Idx": 857 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784147.841, "dur": 2.879, "args": { "External id": 18267,"Sequence number": 246675, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 858 } }, { "ph": "f", "id": 93, "pid": 1336759, "tid": 1381173, "ts": 1295650784147.841, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784148.782, "dur": 1.788, "args": { "External id": 18268,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784149.616, "dur": 0.825, "args": { "External id": 18269,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 860 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784158.394, "dur": 101.554, "args": { "External id": 18270,"Record function id": 0, "Sequence number": 246674, "Fwd thread id": 1, "Ev Idx": 861 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784159.156, "dur": 94.189, "args": { "External id": 18271,"Sequence number": 246674, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 862 } }, { "ph": "f", "id": 94, "pid": 1336759, "tid": 1381173, "ts": 1295650784159.156, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784161.262, "dur": 3.017, "args": { "External id": 18272,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784161.636, "dur": 2.208, "args": { "External id": 18273,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784163.301, "dur": 0.429, "args": { "External id": 18274,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784164.975, "dur": 26.869, "args": { "External id": 18275,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784192.798, "dur": 5.736, "args": { "External id": 18276,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784195.403, "dur": 2.644, "args": { "External id": 18277,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784196.868, "dur": 0.965, "args": { "External id": 18278,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784199.807, "dur": 3.796, "args": { "External id": 18279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784200.375, "dur": 2.818, "args": { "External id": 18280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784201.788, "dur": 1.338, "args": { "External id": 18281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784204.200, "dur": 47.843, "args": { "External id": 18282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 873 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784266.570, "dur": 36.144, "args": { "External id": 18283,"Record function id": 0, "Sequence number": 246673, "Fwd thread id": 1, "Ev Idx": 874 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784269.419, "dur": 5.211, "args": { "External id": 18284,"Sequence number": 246673, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 875 } }, { "ph": "f", "id": 95, "pid": 1336759, "tid": 1381173, "ts": 1295650784269.419, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784271.407, "dur": 3.084, "args": { "External id": 18285,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784272.679, "dur": 1.697, "args": { "External id": 18286,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650784277.809, "dur": 22.905, "args": { "External id": 18287,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784306.487, "dur": 9.930, "args": { "External id": 18288,"Record function id": 0, "Sequence number": 246672, "Fwd thread id": 1, "Ev Idx": 879 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784307.705, "dur": 7.123, "args": { "External id": 18289,"Sequence number": 246672, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 880 } }, { "ph": "f", "id": 96, "pid": 1336759, "tid": 1381173, "ts": 1295650784307.705, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784308.339, "dur": 6.291, "args": { "External id": 18290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784309.341, "dur": 4.697, "args": { "External id": 18291,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784313.341, "dur": 0.577, "args": { "External id": 18292,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 883 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784320.562, "dur": 5.695, "args": { "External id": 18293,"Record function id": 0, "Ev Idx": 884 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784322.280, "dur": 3.486, "args": { "External id": 18294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784323.372, "dur": 2.031, "args": { "External id": 18295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 886 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784323.894, "dur": 1.394, "args": { "External id": 18296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 887 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784329.890, "dur": 6.394, "args": { "External id": 18297,"Record function id": 0, "Sequence number": 246671, "Fwd thread id": 1, "Ev Idx": 888 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784331.294, "dur": 3.296, "args": { "External id": 18298,"Sequence number": 246671, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 889 } }, { "ph": "f", "id": 97, "pid": 1336759, "tid": 1381173, "ts": 1295650784331.294, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784332.496, "dur": 1.923, "args": { "External id": 18299,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784333.238, "dur": 1.021, "args": { "External id": 18300,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 891 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784341.403, "dur": 92.066, "args": { "External id": 18301,"Record function id": 0, "Sequence number": 246670, "Fwd thread id": 1, "Ev Idx": 892 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784343.627, "dur": 83.205, "args": { "External id": 18302,"Sequence number": 246670, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 893 } }, { "ph": "f", "id": 98, "pid": 1336759, "tid": 1381173, "ts": 1295650784343.627, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784345.500, "dur": 3.181, "args": { "External id": 18303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784346.057, "dur": 2.121, "args": { "External id": 18304,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784347.441, "dur": 0.637, "args": { "External id": 18305,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784349.249, "dur": 29.225, "args": { "External id": 18306,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784379.467, "dur": 5.264, "args": { "External id": 18307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784379.940, "dur": 4.209, "args": { "External id": 18308,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784383.125, "dur": 0.906, "args": { "External id": 18309,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784386.039, "dur": 6.542, "args": { "External id": 18310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784389.789, "dur": 2.370, "args": { "External id": 18311,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784391.711, "dur": 0.344, "args": { "External id": 18312,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784393.094, "dur": 32.906, "args": { "External id": 18313,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 904 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784438.185, "dur": 25.254, "args": { "External id": 18314,"Record function id": 0, "Sequence number": 246669, "Fwd thread id": 1, "Ev Idx": 905 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784439.162, "dur": 5.736, "args": { "External id": 18315,"Sequence number": 246669, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 906 } }, { "ph": "f", "id": 99, "pid": 1336759, "tid": 1381173, "ts": 1295650784439.162, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784442.566, "dur": 2.185, "args": { "External id": 18316,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784443.593, "dur": 1.033, "args": { "External id": 18317,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650784447.199, "dur": 14.102, "args": { "External id": 18318,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784466.872, "dur": 7.491, "args": { "External id": 18319,"Record function id": 0, "Sequence number": 246668, "Fwd thread id": 1, "Ev Idx": 910 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784467.811, "dur": 4.652, "args": { "External id": 18320,"Sequence number": 246668, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 911 } }, { "ph": "f", "id": 100, "pid": 1336759, "tid": 1381173, "ts": 1295650784467.811, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784468.745, "dur": 3.533, "args": { "External id": 18321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784469.492, "dur": 2.210, "args": { "External id": 18322,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784471.079, "dur": 0.476, "args": { "External id": 18323,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 914 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784478.362, "dur": 6.502, "args": { "External id": 18324,"Record function id": 0, "Ev Idx": 915 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784479.792, "dur": 4.565, "args": { "External id": 18325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784480.504, "dur": 3.561, "args": { "External id": 18326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 917 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784483.082, "dur": 0.872, "args": { "External id": 18327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 918 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650784489.206, "dur": 341.450, "args": { "External id": 18328,"Record function id": 0, "Sequence number": 246667, "Fwd thread id": 1, "Ev Idx": 919 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650784490.645, "dur": 313.881, "args": { "External id": 18329,"Sequence number": 246667, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 920 } }, { "ph": "f", "id": 101, "pid": 1336759, "tid": 1381173, "ts": 1295650784490.645, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784524.153, "dur": 1.862, "args": { "External id": 18330,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784524.848, "dur": 1.012, "args": { "External id": 18331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650784539.681, "dur": 4.780, "args": { "External id": 18332,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650784556.097, "dur": 1.924, "args": { "External id": 18333,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784701.263, "dur": 1.923, "args": { "External id": 18334,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650784707.685, "dur": 34.048, "args": { "External id": 18335,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784718.549, "dur": 0.873, "args": { "External id": 18336,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650784751.810, "dur": 29.138, "args": { "External id": 18337,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650784753.618, "dur": 27.076, "args": { "External id": 18338,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784758.067, "dur": 5.071, "args": { "External id": 18339,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650784764.662, "dur": 15.558, "args": { "External id": 18340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650784787.191, "dur": 2.419, "args": { "External id": 18341,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784788.514, "dur": 0.960, "args": { "External id": 18342,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784795.844, "dur": 2.269, "args": { "External id": 18343,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650784797.138, "dur": 0.886, "args": { "External id": 18344,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650784812.836, "dur": 14.020, "args": { "External id": 18345,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 936 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784839.506, "dur": 9.811, "args": { "External id": 18346,"Record function id": 0, "Ev Idx": 937 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650784841.866, "dur": 6.789, "args": { "External id": 18347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784843.346, "dur": 4.302, "args": { "External id": 18348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 939 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650784846.395, "dur": 1.127, "args": { "External id": 18349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784853.139, "dur": 4.414, "args": { "External id": 18350,"Record function id": 0, "Sequence number": 246666, "Fwd thread id": 1, "Ev Idx": 941 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650784854.373, "dur": 0.883, "args": { "External id": 18351,"Sequence number": 246666, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 942 } }, { "ph": "f", "id": 102, "pid": 1336759, "tid": 1381173, "ts": 1295650784854.373, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650784861.316, "dur": 471.551, "args": { "External id": 18352,"Record function id": 0, "Sequence number": 246665, "Fwd thread id": 1, "Ev Idx": 943 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650784862.896, "dur": 459.158, "args": { "External id": 18353,"Sequence number": 246665, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 944 } }, { "ph": "f", "id": 103, "pid": 1336759, "tid": 1381173, "ts": 1295650784862.896, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650784890.591, "dur": 8.028, "args": { "External id": 18354,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650784895.620, "dur": 2.745, "args": { "External id": 18355,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784901.376, "dur": 6.267, "args": { "External id": 18356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784904.128, "dur": 2.996, "args": { "External id": 18357,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784906.337, "dur": 0.618, "args": { "External id": 18358,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1381173, "ts": 1295650784911.208, "dur": 116.798, "args": { "External id": 18359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650784911.927, "dur": 3.971, "args": { "External id": 18360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650784912.405, "dur": 3.038, "args": { "External id": 18361,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650784913.681, "dur": 1.682, "args": { "External id": 18362,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1381173, "ts": 1295650784919.687, "dur": 107.734, "args": { "External id": 18363,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650784921.190, "dur": 104.800, "args": { "External id": 18364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650785033.922, "dur": 3.545, "args": { "External id": 18365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785035.653, "dur": 1.686, "args": { "External id": 18366,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785070.256, "dur": 5.770, "args": { "External id": 18367,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785077.204, "dur": 1.525, "args": { "External id": 18368,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785079.759, "dur": 1.405, "args": { "External id": 18369,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785119.325, "dur": 1.930, "args": { "External id": 18370,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785120.092, "dur": 1.053, "args": { "External id": 18371,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336759, "tid": 1381173, "ts": 1295650785141.934, "dur": 160.562, "args": { "External id": 18372,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650785147.253, "dur": 5.933, "args": { "External id": 18373,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785151.444, "dur": 0.851, "args": { "External id": 18374,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650785155.219, "dur": 6.816, "args": { "External id": 18375,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785159.433, "dur": 1.864, "args": { "External id": 18376,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650785163.335, "dur": 2.690, "args": { "External id": 18377,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785165.332, "dur": 0.330, "args": { "External id": 18378,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650785167.005, "dur": 3.138, "args": { "External id": 18379,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785169.065, "dur": 0.603, "args": { "External id": 18380,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650785175.818, "dur": 2.881, "args": { "External id": 18381,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785178.020, "dur": 0.312, "args": { "External id": 18382,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785179.783, "dur": 6.354, "args": { "External id": 18383,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650785184.349, "dur": 1.584, "args": { "External id": 18384,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650785187.584, "dur": 2.801, "args": { "External id": 18385,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785189.735, "dur": 0.344, "args": { "External id": 18386,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785191.084, "dur": 3.115, "args": { "External id": 18387,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785191.964, "dur": 2.134, "args": { "External id": 18388,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650785195.326, "dur": 89.299, "args": { "External id": 18389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785290.501, "dur": 3.234, "args": { "External id": 18390,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650785294.929, "dur": 3.420, "args": { "External id": 18391,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785297.239, "dur": 0.559, "args": { "External id": 18392,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785300.636, "dur": 0.784, "args": { "External id": 18393,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785344.829, "dur": 9.153, "args": { "External id": 18394,"Record function id": 0, "Ev Idx": 985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785347.400, "dur": 5.698, "args": { "External id": 18395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785349.446, "dur": 2.818, "args": { "External id": 18396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785350.170, "dur": 1.992, "args": { "External id": 18397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785358.122, "dur": 6.949, "args": { "External id": 18398,"Record function id": 0, "Sequence number": 246664, "Fwd thread id": 1, "Ev Idx": 989 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785359.349, "dur": 3.568, "args": { "External id": 18399,"Sequence number": 246664, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 990 } }, { "ph": "f", "id": 104, "pid": 1336759, "tid": 1381173, "ts": 1295650785359.349, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785360.804, "dur": 1.863, "args": { "External id": 18400,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785361.663, "dur": 0.871, "args": { "External id": 18401,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785370.604, "dur": 172.184, "args": { "External id": 18402,"Record function id": 0, "Sequence number": 246663, "Fwd thread id": 1, "Ev Idx": 993 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785371.664, "dur": 165.734, "args": { "External id": 18403,"Sequence number": 246663, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 994 } }, { "ph": "f", "id": 105, "pid": 1336759, "tid": 1381173, "ts": 1295650785371.664, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785374.380, "dur": 4.208, "args": { "External id": 18404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785375.495, "dur": 2.519, "args": { "External id": 18405,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785377.346, "dur": 0.501, "args": { "External id": 18406,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650785379.829, "dur": 59.720, "args": { "External id": 18407,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785440.943, "dur": 5.863, "args": { "External id": 18408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785441.599, "dur": 4.373, "args": { "External id": 18409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785444.959, "dur": 0.868, "args": { "External id": 18410,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785447.966, "dur": 3.097, "args": { "External id": 18411,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785448.850, "dur": 1.785, "args": { "External id": 18412,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785450.279, "dur": 0.254, "args": { "External id": 18413,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650785451.746, "dur": 84.939, "args": { "External id": 18414,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785547.549, "dur": 8.087, "args": { "External id": 18415,"Record function id": 0, "Sequence number": 246662, "Fwd thread id": 1, "Ev Idx": 1006 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785548.451, "dur": 6.006, "args": { "External id": 18416,"Sequence number": 246662, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1007 } }, { "ph": "f", "id": 106, "pid": 1336759, "tid": 1381173, "ts": 1295650785548.451, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785549.897, "dur": 4.407, "args": { "External id": 18417,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785553.165, "dur": 1.045, "args": { "External id": 18418,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1009 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785558.728, "dur": 7.062, "args": { "External id": 18419,"Record function id": 0, "Sequence number": 246661, "Fwd thread id": 1, "Ev Idx": 1010 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785559.497, "dur": 4.041, "args": { "External id": 18420,"Sequence number": 246661, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1011 } }, { "ph": "f", "id": 107, "pid": 1336759, "tid": 1381173, "ts": 1295650785559.497, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785560.206, "dur": 3.132, "args": { "External id": 18421,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785560.803, "dur": 2.032, "args": { "External id": 18422,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785562.323, "dur": 0.415, "args": { "External id": 18423,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1014 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785569.810, "dur": 4.672, "args": { "External id": 18424,"Record function id": 0, "Ev Idx": 1015 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785571.303, "dur": 2.639, "args": { "External id": 18425,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785572.243, "dur": 1.442, "args": { "External id": 18426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1017 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785572.688, "dur": 0.872, "args": { "External id": 18427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1018 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785579.805, "dur": 7.928, "args": { "External id": 18428,"Record function id": 0, "Sequence number": 246660, "Fwd thread id": 1, "Ev Idx": 1019 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785580.845, "dur": 5.215, "args": { "External id": 18429,"Sequence number": 246660, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1020 } }, { "ph": "f", "id": 108, "pid": 1336759, "tid": 1381173, "ts": 1295650785580.845, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785584.467, "dur": 1.439, "args": { "External id": 18430,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785585.211, "dur": 0.571, "args": { "External id": 18431,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1022 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785590.861, "dur": 184.437, "args": { "External id": 18432,"Record function id": 0, "Sequence number": 246659, "Fwd thread id": 1, "Ev Idx": 1023 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785613.226, "dur": 155.284, "args": { "External id": 18433,"Sequence number": 246659, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1024 } }, { "ph": "f", "id": 109, "pid": 1336759, "tid": 1381173, "ts": 1295650785613.226, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785614.748, "dur": 4.845, "args": { "External id": 18434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785615.205, "dur": 3.904, "args": { "External id": 18435,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785618.400, "dur": 0.568, "args": { "External id": 18436,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650785620.216, "dur": 51.763, "args": { "External id": 18437,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785673.089, "dur": 4.173, "args": { "External id": 18438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785673.550, "dur": 3.024, "args": { "External id": 18439,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785674.962, "dur": 1.461, "args": { "External id": 18440,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785678.130, "dur": 5.518, "args": { "External id": 18441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785678.809, "dur": 4.441, "args": { "External id": 18442,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785681.744, "dur": 1.425, "args": { "External id": 18443,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650785684.170, "dur": 83.708, "args": { "External id": 18444,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785779.791, "dur": 29.844, "args": { "External id": 18445,"Record function id": 0, "Sequence number": 246658, "Fwd thread id": 1, "Ev Idx": 1036 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785780.639, "dur": 4.022, "args": { "External id": 18446,"Sequence number": 246658, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1037 } }, { "ph": "f", "id": 110, "pid": 1336759, "tid": 1381173, "ts": 1295650785780.639, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785782.139, "dur": 2.369, "args": { "External id": 18447,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785783.244, "dur": 1.165, "args": { "External id": 18448,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650785787.420, "dur": 19.678, "args": { "External id": 18449,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1040 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785813.228, "dur": 9.086, "args": { "External id": 18450,"Record function id": 0, "Sequence number": 246657, "Fwd thread id": 1, "Ev Idx": 1041 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650785814.051, "dur": 6.143, "args": { "External id": 18451,"Sequence number": 246657, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1042 } }, { "ph": "f", "id": 111, "pid": 1336759, "tid": 1381173, "ts": 1295650785814.051, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650785816.531, "dur": 3.426, "args": { "External id": 18452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650785817.173, "dur": 2.157, "args": { "External id": 18453,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650785818.780, "dur": 0.448, "args": { "External id": 18454,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1045 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785826.213, "dur": 4.614, "args": { "External id": 18455,"Record function id": 0, "Ev Idx": 1046 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650785827.939, "dur": 2.410, "args": { "External id": 18456,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785828.729, "dur": 1.329, "args": { "External id": 18457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1048 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650785829.064, "dur": 0.882, "args": { "External id": 18458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1049 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650785835.038, "dur": 480.982, "args": { "External id": 18459,"Record function id": 0, "Sequence number": 246656, "Fwd thread id": 1, "Ev Idx": 1050 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650785836.526, "dur": 443.830, "args": { "External id": 18460,"Sequence number": 246656, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1051 } }, { "ph": "f", "id": 112, "pid": 1336759, "tid": 1381173, "ts": 1295650785836.526, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1381173, "ts": 1295650785857.942, "dur": 32.044, "args": { "External id": 18461,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650785859.395, "dur": 30.344, "args": { "External id": 18462,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650785862.470, "dur": 5.360, "args": { "External id": 18463,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785864.928, "dur": 2.372, "args": { "External id": 18464,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650785869.314, "dur": 19.944, "args": { "External id": 18465,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785901.436, "dur": 2.048, "args": { "External id": 18466,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785902.235, "dur": 1.120, "args": { "External id": 18467,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650785906.808, "dur": 2.326, "args": { "External id": 18468,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650785907.441, "dur": 1.607, "args": { "External id": 18469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785922.436, "dur": 2.223, "args": { "External id": 18470,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650785935.191, "dur": 1.728, "args": { "External id": 18471,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786148.966, "dur": 3.626, "args": { "External id": 18472,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650786157.189, "dur": 34.072, "args": { "External id": 18473,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786167.656, "dur": 1.048, "args": { "External id": 18474,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650786197.270, "dur": 29.437, "args": { "External id": 18475,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650786199.106, "dur": 27.356, "args": { "External id": 18476,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786203.607, "dur": 3.806, "args": { "External id": 18477,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650786210.947, "dur": 14.978, "args": { "External id": 18478,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650786248.160, "dur": 3.373, "args": { "External id": 18479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786249.685, "dur": 1.606, "args": { "External id": 18480,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650786259.275, "dur": 2.725, "args": { "External id": 18481,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786260.580, "dur": 1.267, "args": { "External id": 18482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650786264.564, "dur": 3.568, "args": { "External id": 18483,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786265.829, "dur": 2.209, "args": { "External id": 18484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650786295.475, "dur": 18.927, "args": { "External id": 18485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1076 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650786330.592, "dur": 9.591, "args": { "External id": 18486,"Record function id": 0, "Ev Idx": 1077 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650786333.133, "dur": 6.201, "args": { "External id": 18487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650786335.299, "dur": 3.083, "args": { "External id": 18488,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1079 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650786336.243, "dur": 2.054, "args": { "External id": 18489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1080 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786344.022, "dur": 7.939, "args": { "External id": 18490,"Record function id": 0, "Sequence number": 246655, "Fwd thread id": 1, "Ev Idx": 1081 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786345.426, "dur": 4.326, "args": { "External id": 18491,"Sequence number": 246655, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1082 } }, { "ph": "f", "id": 113, "pid": 1336759, "tid": 1381173, "ts": 1295650786345.426, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650786347.317, "dur": 2.200, "args": { "External id": 18492,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786348.382, "dur": 1.004, "args": { "External id": 18493,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1084 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786357.620, "dur": 123.435, "args": { "External id": 18494,"Record function id": 0, "Sequence number": 246654, "Fwd thread id": 1, "Ev Idx": 1085 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786358.526, "dur": 116.080, "args": { "External id": 18495,"Sequence number": 246654, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1086 } }, { "ph": "f", "id": 114, "pid": 1336759, "tid": 1381173, "ts": 1295650786358.526, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650786361.255, "dur": 5.609, "args": { "External id": 18496,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650786362.868, "dur": 3.411, "args": { "External id": 18497,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786364.835, "dur": 1.207, "args": { "External id": 18498,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650786368.030, "dur": 53.909, "args": { "External id": 18499,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650786423.059, "dur": 6.857, "args": { "External id": 18500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650786425.581, "dur": 3.646, "args": { "External id": 18501,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786427.254, "dur": 1.798, "args": { "External id": 18502,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650786431.341, "dur": 3.743, "args": { "External id": 18503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650786432.310, "dur": 2.316, "args": { "External id": 18504,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786434.043, "dur": 0.477, "args": { "External id": 18505,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650786435.685, "dur": 38.109, "args": { "External id": 18506,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786486.054, "dur": 11.617, "args": { "External id": 18507,"Record function id": 0, "Sequence number": 246653, "Fwd thread id": 1, "Ev Idx": 1098 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786487.326, "dur": 7.948, "args": { "External id": 18508,"Sequence number": 246653, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1099 } }, { "ph": "f", "id": 115, "pid": 1336759, "tid": 1381173, "ts": 1295650786487.326, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650786491.203, "dur": 3.918, "args": { "External id": 18509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786492.482, "dur": 2.535, "args": { "External id": 18510,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786501.225, "dur": 7.475, "args": { "External id": 18511,"Record function id": 0, "Sequence number": 246652, "Fwd thread id": 1, "Ev Idx": 1102 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786501.951, "dur": 4.759, "args": { "External id": 18512,"Sequence number": 246652, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1103 } }, { "ph": "f", "id": 116, "pid": 1336759, "tid": 1381173, "ts": 1295650786501.951, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650786502.770, "dur": 3.737, "args": { "External id": 18513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650786503.590, "dur": 2.424, "args": { "External id": 18514,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786505.466, "dur": 0.461, "args": { "External id": 18515,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1106 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650786512.761, "dur": 7.287, "args": { "External id": 18516,"Record function id": 0, "Ev Idx": 1107 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650786514.514, "dur": 4.971, "args": { "External id": 18517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650786515.439, "dur": 3.806, "args": { "External id": 18518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1109 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650786518.176, "dur": 0.955, "args": { "External id": 18519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1110 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786525.120, "dur": 5.694, "args": { "External id": 18520,"Record function id": 0, "Sequence number": 246651, "Fwd thread id": 1, "Ev Idx": 1111 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650786525.827, "dur": 3.453, "args": { "External id": 18521,"Sequence number": 246651, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1112 } }, { "ph": "f", "id": 117, "pid": 1336759, "tid": 1381173, "ts": 1295650786525.827, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650786527.003, "dur": 2.116, "args": { "External id": 18522,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650786527.774, "dur": 1.194, "args": { "External id": 18523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1114 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650786534.627, "dur": 275.508, "args": { "External id": 18524,"Record function id": 0, "Sequence number": 246650, "Fwd thread id": 1, "Ev Idx": 1115 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650786536.306, "dur": 258.581, "args": { "External id": 18525,"Sequence number": 246650, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1116 } }, { "ph": "f", "id": 118, "pid": 1336759, "tid": 1381173, "ts": 1295650786536.306, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650786549.589, "dur": 7.429, "args": { "External id": 18526,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786552.877, "dur": 3.641, "args": { "External id": 18527,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650786559.012, "dur": 4.123, "args": { "External id": 18528,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786560.660, "dur": 2.255, "args": { "External id": 18529,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650786572.503, "dur": 5.488, "args": { "External id": 18530,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786576.265, "dur": 1.446, "args": { "External id": 18531,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1122 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650786602.201, "dur": 167.845, "args": { "External id": 18532,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650786680.917, "dur": 3.871, "args": { "External id": 18533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650786686.684, "dur": 3.292, "args": { "External id": 18534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650786782.873, "dur": 3.201, "args": { "External id": 18535,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650786788.974, "dur": 0.786, "args": { "External id": 18536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650786791.583, "dur": 0.648, "args": { "External id": 18537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1128 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650786817.190, "dur": 266.029, "args": { "External id": 18538,"Record function id": 0, "Sequence number": 246649, "Fwd thread id": 1, "Ev Idx": 1129 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650786819.217, "dur": 255.414, "args": { "External id": 18539,"Sequence number": 246649, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1130 } }, { "ph": "f", "id": 119, "pid": 1336759, "tid": 1381173, "ts": 1295650786819.217, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650786838.083, "dur": 43.252, "args": { "External id": 18540,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786840.917, "dur": 3.029, "args": { "External id": 18541,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650786845.401, "dur": 35.346, "args": { "External id": 18542,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650786890.114, "dur": 4.481, "args": { "External id": 18543,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650786891.995, "dur": 2.246, "args": { "External id": 18544,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1135 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650787093.045, "dur": 195.787, "args": { "External id": 18545,"Record function id": 0, "Sequence number": 246648, "Fwd thread id": 1, "Ev Idx": 1136 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650787095.569, "dur": 186.160, "args": { "External id": 18546,"Sequence number": 246648, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1137 } }, { "ph": "f", "id": 120, "pid": 1336759, "tid": 1381173, "ts": 1295650787095.569, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650787109.426, "dur": 46.169, "args": { "External id": 18547,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787112.605, "dur": 4.040, "args": { "External id": 18548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650787121.347, "dur": 33.728, "args": { "External id": 18549,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650787164.196, "dur": 4.354, "args": { "External id": 18550,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787166.426, "dur": 1.787, "args": { "External id": 18551,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1142 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787299.561, "dur": 16.480, "args": { "External id": 18552,"Record function id": 0, "Sequence number": 246647, "Fwd thread id": 1, "Ev Idx": 1143 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787301.306, "dur": 12.007, "args": { "External id": 18553,"Sequence number": 246647, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1144 } }, { "ph": "f", "id": 121, "pid": 1336759, "tid": 1381173, "ts": 1295650787301.306, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787304.052, "dur": 8.958, "args": { "External id": 18554,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787305.665, "dur": 7.141, "args": { "External id": 18555,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1146 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787319.569, "dur": 5.954, "args": { "External id": 18556,"Record function id": 0, "Sequence number": 246646, "Fwd thread id": 1, "Ev Idx": 1147 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787320.501, "dur": 3.593, "args": { "External id": 18557,"Sequence number": 246646, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1148 } }, { "ph": "f", "id": 122, "pid": 1336759, "tid": 1381173, "ts": 1295650787320.501, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787321.719, "dur": 2.225, "args": { "External id": 18558,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787322.899, "dur": 0.931, "args": { "External id": 18559,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1150 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787328.640, "dur": 7.721, "args": { "External id": 18560,"Record function id": 0, "Sequence number": 246645, "Fwd thread id": 1, "Ev Idx": 1151 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787329.510, "dur": 5.235, "args": { "External id": 18561,"Sequence number": 246645, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1152 } }, { "ph": "f", "id": 123, "pid": 1336759, "tid": 1381173, "ts": 1295650787329.510, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787332.962, "dur": 1.648, "args": { "External id": 18562,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787333.736, "dur": 0.747, "args": { "External id": 18563,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787340.135, "dur": 5.827, "args": { "External id": 18564,"Record function id": 0, "Sequence number": 246644, "Fwd thread id": 1, "Ev Idx": 1155 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787341.337, "dur": 3.084, "args": { "External id": 18565,"Sequence number": 246644, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1156 } }, { "ph": "f", "id": 124, "pid": 1336759, "tid": 1381173, "ts": 1295650787341.337, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787342.676, "dur": 1.607, "args": { "External id": 18566,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787343.285, "dur": 0.871, "args": { "External id": 18567,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1158 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787349.416, "dur": 150.909, "args": { "External id": 18568,"Record function id": 0, "Sequence number": 246643, "Fwd thread id": 1, "Ev Idx": 1159 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787350.362, "dur": 143.590, "args": { "External id": 18569,"Sequence number": 246643, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1160 } }, { "ph": "f", "id": 125, "pid": 1336759, "tid": 1381173, "ts": 1295650787350.362, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787353.963, "dur": 9.224, "args": { "External id": 18570,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787358.007, "dur": 4.497, "args": { "External id": 18571,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787360.575, "dur": 1.584, "args": { "External id": 18572,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787364.835, "dur": 69.891, "args": { "External id": 18573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787436.050, "dur": 4.915, "args": { "External id": 18574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787436.751, "dur": 3.569, "args": { "External id": 18575,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787438.977, "dur": 1.147, "args": { "External id": 18576,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787442.608, "dur": 5.946, "args": { "External id": 18577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787445.720, "dur": 2.325, "args": { "External id": 18578,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787447.651, "dur": 0.315, "args": { "External id": 18579,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787449.149, "dur": 43.985, "args": { "External id": 18580,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1171 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787507.961, "dur": 7.190, "args": { "External id": 18581,"Record function id": 0, "Sequence number": 246642, "Fwd thread id": 1, "Ev Idx": 1172 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787508.835, "dur": 4.504, "args": { "External id": 18582,"Sequence number": 246642, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1173 } }, { "ph": "f", "id": 126, "pid": 1336759, "tid": 1381173, "ts": 1295650787508.835, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787510.569, "dur": 2.628, "args": { "External id": 18583,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787511.878, "dur": 1.210, "args": { "External id": 18584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1175 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787518.268, "dur": 9.004, "args": { "External id": 18585,"Record function id": 0, "Sequence number": 246641, "Fwd thread id": 1, "Ev Idx": 1176 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787519.011, "dur": 6.582, "args": { "External id": 18586,"Sequence number": 246641, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1177 } }, { "ph": "f", "id": 127, "pid": 1336759, "tid": 1381173, "ts": 1295650787519.011, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787521.784, "dur": 3.593, "args": { "External id": 18587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787522.593, "dur": 2.301, "args": { "External id": 18588,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787524.285, "dur": 0.427, "args": { "External id": 18589,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787533.479, "dur": 9.552, "args": { "External id": 18590,"Record function id": 0, "Ev Idx": 1181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787535.389, "dur": 6.821, "args": { "External id": 18591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787537.737, "dur": 4.020, "args": { "External id": 18592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787539.051, "dur": 2.636, "args": { "External id": 18593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787546.835, "dur": 7.464, "args": { "External id": 18594,"Record function id": 0, "Sequence number": 246640, "Fwd thread id": 1, "Ev Idx": 1185 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787548.193, "dur": 4.698, "args": { "External id": 18595,"Sequence number": 246640, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1186 } }, { "ph": "f", "id": 128, "pid": 1336759, "tid": 1381173, "ts": 1295650787548.193, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787549.073, "dur": 3.664, "args": { "External id": 18596,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787551.865, "dur": 0.739, "args": { "External id": 18597,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787557.470, "dur": 89.901, "args": { "External id": 18598,"Record function id": 0, "Sequence number": 246639, "Fwd thread id": 1, "Ev Idx": 1189 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787558.144, "dur": 83.807, "args": { "External id": 18599,"Sequence number": 246639, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1190 } }, { "ph": "f", "id": 129, "pid": 1336759, "tid": 1381173, "ts": 1295650787558.144, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787560.244, "dur": 3.672, "args": { "External id": 18600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787560.830, "dur": 2.645, "args": { "External id": 18601,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787562.857, "dur": 0.475, "args": { "External id": 18602,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787564.740, "dur": 26.563, "args": { "External id": 18603,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787594.259, "dur": 4.015, "args": { "External id": 18604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787594.774, "dur": 2.895, "args": { "External id": 18605,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787596.538, "dur": 0.995, "args": { "External id": 18606,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787599.475, "dur": 4.426, "args": { "External id": 18607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787600.499, "dur": 2.944, "args": { "External id": 18608,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787601.963, "dur": 1.378, "args": { "External id": 18609,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787606.393, "dur": 34.941, "args": { "External id": 18610,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1201 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787651.717, "dur": 32.226, "args": { "External id": 18611,"Record function id": 0, "Sequence number": 246638, "Fwd thread id": 1, "Ev Idx": 1202 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787652.645, "dur": 4.051, "args": { "External id": 18612,"Sequence number": 246638, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1203 } }, { "ph": "f", "id": 130, "pid": 1336759, "tid": 1381173, "ts": 1295650787652.645, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787654.436, "dur": 2.116, "args": { "External id": 18613,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787655.425, "dur": 1.009, "args": { "External id": 18614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650787659.778, "dur": 21.865, "args": { "External id": 18615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1206 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787687.443, "dur": 9.747, "args": { "External id": 18616,"Record function id": 0, "Sequence number": 246637, "Fwd thread id": 1, "Ev Idx": 1207 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787688.337, "dur": 6.955, "args": { "External id": 18617,"Sequence number": 246637, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1208 } }, { "ph": "f", "id": 131, "pid": 1336759, "tid": 1381173, "ts": 1295650787688.337, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787688.988, "dur": 6.078, "args": { "External id": 18618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787692.268, "dur": 2.233, "args": { "External id": 18619,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787693.986, "dur": 0.396, "args": { "External id": 18620,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787701.211, "dur": 4.952, "args": { "External id": 18621,"Record function id": 0, "Ev Idx": 1212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787702.845, "dur": 2.835, "args": { "External id": 18622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787703.768, "dur": 1.506, "args": { "External id": 18623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787704.119, "dur": 1.082, "args": { "External id": 18624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787709.675, "dur": 9.607, "args": { "External id": 18625,"Record function id": 0, "Sequence number": 246636, "Fwd thread id": 1, "Ev Idx": 1216 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787711.128, "dur": 6.207, "args": { "External id": 18626,"Sequence number": 246636, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1217 } }, { "ph": "f", "id": 132, "pid": 1336759, "tid": 1381173, "ts": 1295650787711.128, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787712.547, "dur": 4.633, "args": { "External id": 18627,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787716.137, "dur": 0.938, "args": { "External id": 18628,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787724.544, "dur": 83.028, "args": { "External id": 18629,"Record function id": 0, "Sequence number": 246635, "Fwd thread id": 1, "Ev Idx": 1220 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787725.269, "dur": 75.688, "args": { "External id": 18630,"Sequence number": 246635, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1221 } }, { "ph": "f", "id": 133, "pid": 1336759, "tid": 1381173, "ts": 1295650787725.269, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787726.886, "dur": 3.608, "args": { "External id": 18631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787727.333, "dur": 2.720, "args": { "External id": 18632,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787729.259, "dur": 0.690, "args": { "External id": 18633,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787731.304, "dur": 24.688, "args": { "External id": 18634,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787756.980, "dur": 6.532, "args": { "External id": 18635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787759.482, "dur": 3.422, "args": { "External id": 18636,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787761.162, "dur": 1.530, "args": { "External id": 18637,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787764.446, "dur": 3.100, "args": { "External id": 18638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787765.418, "dur": 1.751, "args": { "External id": 18639,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787766.771, "dur": 0.281, "args": { "External id": 18640,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650787768.072, "dur": 32.012, "args": { "External id": 18641,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1232 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787811.599, "dur": 26.041, "args": { "External id": 18642,"Record function id": 0, "Sequence number": 246634, "Fwd thread id": 1, "Ev Idx": 1233 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787812.642, "dur": 6.674, "args": { "External id": 18643,"Sequence number": 246634, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1234 } }, { "ph": "f", "id": 134, "pid": 1336759, "tid": 1381173, "ts": 1295650787812.642, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787816.757, "dur": 2.418, "args": { "External id": 18644,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787817.917, "dur": 1.109, "args": { "External id": 18645,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650787821.577, "dur": 14.383, "args": { "External id": 18646,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1237 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787841.031, "dur": 7.485, "args": { "External id": 18647,"Record function id": 0, "Sequence number": 246633, "Fwd thread id": 1, "Ev Idx": 1238 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650787841.753, "dur": 5.001, "args": { "External id": 18648,"Sequence number": 246633, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1239 } }, { "ph": "f", "id": 135, "pid": 1336759, "tid": 1381173, "ts": 1295650787841.753, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650787842.844, "dur": 3.728, "args": { "External id": 18649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650787843.724, "dur": 2.334, "args": { "External id": 18650,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650787845.513, "dur": 0.411, "args": { "External id": 18651,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787852.480, "dur": 6.853, "args": { "External id": 18652,"Record function id": 0, "Ev Idx": 1243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650787854.364, "dur": 4.529, "args": { "External id": 18653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787855.155, "dur": 3.405, "args": { "External id": 18654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650787857.736, "dur": 0.739, "args": { "External id": 18655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650787865.537, "dur": 405.856, "args": { "External id": 18656,"Record function id": 0, "Sequence number": 246632, "Fwd thread id": 1, "Ev Idx": 1247 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650787867.081, "dur": 353.824, "args": { "External id": 18657,"Sequence number": 246632, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1248 } }, { "ph": "f", "id": 136, "pid": 1336759, "tid": 1381173, "ts": 1295650787867.081, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650787896.457, "dur": 2.241, "args": { "External id": 18658,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650787897.419, "dur": 1.134, "args": { "External id": 18659,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650787912.249, "dur": 4.826, "args": { "External id": 18660,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650787925.888, "dur": 1.880, "args": { "External id": 18661,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788114.911, "dur": 3.194, "args": { "External id": 18662,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650788122.554, "dur": 38.276, "args": { "External id": 18663,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788133.659, "dur": 0.987, "args": { "External id": 18664,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650788166.778, "dur": 28.855, "args": { "External id": 18665,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650788168.439, "dur": 27.022, "args": { "External id": 18666,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788173.223, "dur": 4.899, "args": { "External id": 18667,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650788179.728, "dur": 15.291, "args": { "External id": 18668,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650788200.233, "dur": 5.157, "args": { "External id": 18669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788203.894, "dur": 1.363, "args": { "External id": 18670,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788211.993, "dur": 2.598, "args": { "External id": 18671,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788213.053, "dur": 1.447, "args": { "External id": 18672,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650788248.638, "dur": 17.746, "args": { "External id": 18673,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1264 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788284.091, "dur": 10.149, "args": { "External id": 18674,"Record function id": 0, "Ev Idx": 1265 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788287.084, "dur": 6.348, "args": { "External id": 18675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788289.208, "dur": 3.316, "args": { "External id": 18676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1267 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788290.384, "dur": 2.021, "args": { "External id": 18677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1268 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788298.181, "dur": 6.852, "args": { "External id": 18678,"Record function id": 0, "Sequence number": 246631, "Fwd thread id": 1, "Ev Idx": 1269 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788301.148, "dur": 1.204, "args": { "External id": 18679,"Sequence number": 246631, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1270 } }, { "ph": "f", "id": 137, "pid": 1336759, "tid": 1381173, "ts": 1295650788301.148, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650788309.145, "dur": 391.108, "args": { "External id": 18680,"Record function id": 0, "Sequence number": 246630, "Fwd thread id": 1, "Ev Idx": 1271 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650788310.654, "dur": 379.170, "args": { "External id": 18681,"Sequence number": 246630, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1272 } }, { "ph": "f", "id": 138, "pid": 1336759, "tid": 1381173, "ts": 1295650788310.654, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788342.241, "dur": 8.531, "args": { "External id": 18682,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650788347.404, "dur": 3.066, "args": { "External id": 18683,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 1274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788353.976, "dur": 7.524, "args": { "External id": 18684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788355.193, "dur": 5.659, "args": { "External id": 18685,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788359.558, "dur": 1.114, "args": { "External id": 18686,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1381173, "ts": 1295650788365.134, "dur": 85.333, "args": { "External id": 18687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 1278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788365.905, "dur": 4.135, "args": { "External id": 18688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 1279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788366.507, "dur": 3.064, "args": { "External id": 18689,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788367.858, "dur": 1.564, "args": { "External id": 18690,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1381173, "ts": 1295650788371.203, "dur": 78.759, "args": { "External id": 18691,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650788372.694, "dur": 76.457, "args": { "External id": 18692,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650788456.206, "dur": 3.161, "args": { "External id": 18693,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 1284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788457.712, "dur": 1.507, "args": { "External id": 18694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650788492.369, "dur": 4.922, "args": { "External id": 18695,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650788498.710, "dur": 1.610, "args": { "External id": 18696,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650788501.683, "dur": 1.487, "args": { "External id": 18697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788535.089, "dur": 2.250, "args": { "External id": 18698,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788536.117, "dur": 1.073, "args": { "External id": 18699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336759, "tid": 1381173, "ts": 1295650788557.416, "dur": 113.526, "args": { "External id": 18700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 1291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650788562.076, "dur": 6.091, "args": { "External id": 18701,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788565.834, "dur": 1.458, "args": { "External id": 18702,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650788570.051, "dur": 6.422, "args": { "External id": 18703,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 1294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788574.004, "dur": 1.710, "args": { "External id": 18704,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 1295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1381173, "ts": 1295650788577.676, "dur": 2.503, "args": { "External id": 18705,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788579.427, "dur": 0.311, "args": { "External id": 18706,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650788581.286, "dur": 3.406, "args": { "External id": 18707,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788583.606, "dur": 0.560, "args": { "External id": 18708,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 1299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650788590.568, "dur": 2.826, "args": { "External id": 18709,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 1300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788592.606, "dur": 0.473, "args": { "External id": 18710,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 1301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788594.594, "dur": 5.127, "args": { "External id": 18711,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 1302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336759, "tid": 1381173, "ts": 1295650788598.077, "dur": 1.460, "args": { "External id": 18712,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 1303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650788600.903, "dur": 2.637, "args": { "External id": 18713,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 1304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788602.896, "dur": 0.371, "args": { "External id": 18714,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 1305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788604.478, "dur": 3.656, "args": { "External id": 18715,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788605.519, "dur": 2.513, "args": { "External id": 18716,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650788609.558, "dur": 48.569, "args": { "External id": 18717,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 1308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788660.195, "dur": 2.069, "args": { "External id": 18718,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 1309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336759, "tid": 1381173, "ts": 1295650788663.550, "dur": 3.338, "args": { "External id": 18719,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 1310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788665.978, "dur": 0.487, "args": { "External id": 18720,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 1311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788668.897, "dur": 0.974, "args": { "External id": 18721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 1312 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788708.732, "dur": 7.573, "args": { "External id": 18722,"Record function id": 0, "Ev Idx": 1313 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788711.239, "dur": 4.386, "args": { "External id": 18723,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788712.600, "dur": 2.262, "args": { "External id": 18724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1315 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788713.252, "dur": 1.490, "args": { "External id": 18725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1316 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788720.228, "dur": 7.246, "args": { "External id": 18726,"Record function id": 0, "Sequence number": 246629, "Fwd thread id": 1, "Ev Idx": 1317 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788721.780, "dur": 3.775, "args": { "External id": 18727,"Sequence number": 246629, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1318 } }, { "ph": "f", "id": 139, "pid": 1336759, "tid": 1381173, "ts": 1295650788721.780, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788723.426, "dur": 1.938, "args": { "External id": 18728,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788724.240, "dur": 0.992, "args": { "External id": 18729,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1320 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788731.222, "dur": 114.995, "args": { "External id": 18730,"Record function id": 0, "Sequence number": 246628, "Fwd thread id": 1, "Ev Idx": 1321 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788732.143, "dur": 108.441, "args": { "External id": 18731,"Sequence number": 246628, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1322 } }, { "ph": "f", "id": 140, "pid": 1336759, "tid": 1381173, "ts": 1295650788732.143, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788736.584, "dur": 3.796, "args": { "External id": 18732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788737.589, "dur": 2.295, "args": { "External id": 18733,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788739.155, "dur": 0.595, "args": { "External id": 18734,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650788741.447, "dur": 38.048, "args": { "External id": 18735,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788780.677, "dur": 5.464, "args": { "External id": 18736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788781.239, "dur": 4.222, "args": { "External id": 18737,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788784.557, "dur": 0.738, "args": { "External id": 18738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788787.503, "dur": 4.287, "args": { "External id": 18739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788788.571, "dur": 2.471, "args": { "External id": 18740,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788790.494, "dur": 0.481, "args": { "External id": 18741,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650788792.330, "dur": 47.484, "args": { "External id": 18742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788850.945, "dur": 8.636, "args": { "External id": 18743,"Record function id": 0, "Sequence number": 246627, "Fwd thread id": 1, "Ev Idx": 1334 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788851.947, "dur": 6.347, "args": { "External id": 18744,"Sequence number": 246627, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1335 } }, { "ph": "f", "id": 141, "pid": 1336759, "tid": 1381173, "ts": 1295650788851.947, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788853.897, "dur": 4.236, "args": { "External id": 18745,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788856.984, "dur": 1.046, "args": { "External id": 18746,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788863.025, "dur": 7.324, "args": { "External id": 18747,"Record function id": 0, "Sequence number": 246626, "Fwd thread id": 1, "Ev Idx": 1338 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788863.921, "dur": 4.353, "args": { "External id": 18748,"Sequence number": 246626, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1339 } }, { "ph": "f", "id": 142, "pid": 1336759, "tid": 1381173, "ts": 1295650788863.921, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788864.743, "dur": 3.307, "args": { "External id": 18749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788865.304, "dur": 2.247, "args": { "External id": 18750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788867.016, "dur": 0.386, "args": { "External id": 18751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1342 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788874.303, "dur": 5.380, "args": { "External id": 18752,"Record function id": 0, "Ev Idx": 1343 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650788876.202, "dur": 3.003, "args": { "External id": 18753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788877.199, "dur": 1.759, "args": { "External id": 18754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1345 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650788877.823, "dur": 1.039, "args": { "External id": 18755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1346 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788882.803, "dur": 7.920, "args": { "External id": 18756,"Record function id": 0, "Sequence number": 246625, "Fwd thread id": 1, "Ev Idx": 1347 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788884.140, "dur": 4.931, "args": { "External id": 18757,"Sequence number": 246625, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1348 } }, { "ph": "f", "id": 143, "pid": 1336759, "tid": 1381173, "ts": 1295650788884.140, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650788887.082, "dur": 1.851, "args": { "External id": 18758,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650788888.005, "dur": 0.800, "args": { "External id": 18759,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788893.845, "dur": 151.008, "args": { "External id": 18760,"Record function id": 0, "Sequence number": 246624, "Fwd thread id": 1, "Ev Idx": 1351 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650788894.646, "dur": 140.592, "args": { "External id": 18761,"Sequence number": 246624, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1352 } }, { "ph": "f", "id": 144, "pid": 1336759, "tid": 1381173, "ts": 1295650788894.646, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788896.421, "dur": 4.994, "args": { "External id": 18762,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788896.897, "dur": 4.081, "args": { "External id": 18763,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788900.245, "dur": 0.603, "args": { "External id": 18764,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650788902.014, "dur": 31.185, "args": { "External id": 18765,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788934.317, "dur": 3.610, "args": { "External id": 18766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788935.037, "dur": 2.291, "args": { "External id": 18767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788936.452, "dur": 0.669, "args": { "External id": 18768,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650788938.941, "dur": 6.184, "args": { "External id": 18769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650788939.878, "dur": 4.825, "args": { "External id": 18770,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650788943.060, "dur": 1.577, "args": { "External id": 18771,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650788945.589, "dur": 88.191, "args": { "External id": 18772,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789053.983, "dur": 34.383, "args": { "External id": 18773,"Record function id": 0, "Sequence number": 246623, "Fwd thread id": 1, "Ev Idx": 1364 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789055.208, "dur": 5.053, "args": { "External id": 18774,"Sequence number": 246623, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1365 } }, { "ph": "f", "id": 145, "pid": 1336759, "tid": 1381173, "ts": 1295650789055.208, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789057.037, "dur": 3.060, "args": { "External id": 18775,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789058.278, "dur": 1.723, "args": { "External id": 18776,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650789063.491, "dur": 21.836, "args": { "External id": 18777,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789092.157, "dur": 10.220, "args": { "External id": 18778,"Record function id": 0, "Sequence number": 246622, "Fwd thread id": 1, "Ev Idx": 1369 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789093.324, "dur": 7.255, "args": { "External id": 18779,"Sequence number": 246622, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1370 } }, { "ph": "f", "id": 146, "pid": 1336759, "tid": 1381173, "ts": 1295650789093.324, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650789094.248, "dur": 6.120, "args": { "External id": 18780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650789097.482, "dur": 2.235, "args": { "External id": 18781,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789098.949, "dur": 0.650, "args": { "External id": 18782,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1373 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789106.603, "dur": 5.593, "args": { "External id": 18783,"Record function id": 0, "Ev Idx": 1374 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789108.366, "dur": 3.346, "args": { "External id": 18784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789109.502, "dur": 1.894, "args": { "External id": 18785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1376 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789110.026, "dur": 1.277, "args": { "External id": 18786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1377 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650789116.336, "dur": 427.304, "args": { "External id": 18787,"Record function id": 0, "Sequence number": 246621, "Fwd thread id": 1, "Ev Idx": 1378 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650789122.250, "dur": 388.318, "args": { "External id": 18788,"Sequence number": 246621, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1379 } }, { "ph": "f", "id": 147, "pid": 1336759, "tid": 1381173, "ts": 1295650789122.250, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1381173, "ts": 1295650789146.231, "dur": 32.710, "args": { "External id": 18789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650789147.549, "dur": 31.192, "args": { "External id": 18790,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650789150.296, "dur": 5.768, "args": { "External id": 18791,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650789152.687, "dur": 2.766, "args": { "External id": 18792,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650789157.396, "dur": 20.816, "args": { "External id": 18793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789190.918, "dur": 2.551, "args": { "External id": 18794,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789191.954, "dur": 1.400, "args": { "External id": 18795,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789197.238, "dur": 3.029, "args": { "External id": 18796,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789198.407, "dur": 1.729, "args": { "External id": 18797,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650789214.451, "dur": 2.033, "args": { "External id": 18798,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650789246.531, "dur": 4.224, "args": { "External id": 18799,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789403.873, "dur": 3.826, "args": { "External id": 18800,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650789412.251, "dur": 32.603, "args": { "External id": 18801,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789421.832, "dur": 0.976, "args": { "External id": 18802,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650789450.491, "dur": 28.166, "args": { "External id": 18803,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650789452.263, "dur": 26.200, "args": { "External id": 18804,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789456.608, "dur": 3.595, "args": { "External id": 18805,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650789463.385, "dur": 14.500, "args": { "External id": 18806,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650789482.905, "dur": 2.847, "args": { "External id": 18807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789484.576, "dur": 1.052, "args": { "External id": 18808,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789492.269, "dur": 2.646, "args": { "External id": 18809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789493.392, "dur": 1.389, "args": { "External id": 18810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789497.063, "dur": 2.880, "args": { "External id": 18811,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789497.893, "dur": 1.947, "args": { "External id": 18812,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650789525.420, "dur": 16.587, "args": { "External id": 18813,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1404 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789556.153, "dur": 8.539, "args": { "External id": 18814,"Record function id": 0, "Ev Idx": 1405 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789558.538, "dur": 5.392, "args": { "External id": 18815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789560.260, "dur": 2.757, "args": { "External id": 18816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1407 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789561.291, "dur": 1.634, "args": { "External id": 18817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1408 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789568.396, "dur": 9.072, "args": { "External id": 18818,"Record function id": 0, "Sequence number": 246620, "Fwd thread id": 1, "Ev Idx": 1409 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789569.997, "dur": 5.462, "args": { "External id": 18819,"Sequence number": 246620, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1410 } }, { "ph": "f", "id": 148, "pid": 1336759, "tid": 1381173, "ts": 1295650789569.997, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789571.425, "dur": 3.853, "args": { "External id": 18820,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789574.057, "dur": 1.098, "args": { "External id": 18821,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1412 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789580.697, "dur": 128.533, "args": { "External id": 18822,"Record function id": 0, "Sequence number": 246619, "Fwd thread id": 1, "Ev Idx": 1413 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789581.800, "dur": 121.503, "args": { "External id": 18823,"Sequence number": 246619, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1414 } }, { "ph": "f", "id": 149, "pid": 1336759, "tid": 1381173, "ts": 1295650789581.800, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650789584.306, "dur": 4.863, "args": { "External id": 18824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650789585.649, "dur": 2.887, "args": { "External id": 18825,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789587.484, "dur": 0.850, "args": { "External id": 18826,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650789590.397, "dur": 55.428, "args": { "External id": 18827,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650789649.561, "dur": 5.316, "args": { "External id": 18828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650789650.233, "dur": 3.979, "args": { "External id": 18829,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789652.450, "dur": 1.565, "args": { "External id": 18830,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650789656.104, "dur": 3.277, "args": { "External id": 18831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650789657.006, "dur": 1.922, "args": { "External id": 18832,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789658.432, "dur": 0.424, "args": { "External id": 18833,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650789662.617, "dur": 39.898, "args": { "External id": 18834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1425 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789713.855, "dur": 8.235, "args": { "External id": 18835,"Record function id": 0, "Sequence number": 246618, "Fwd thread id": 1, "Ev Idx": 1426 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789714.785, "dur": 5.516, "args": { "External id": 18836,"Sequence number": 246618, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1427 } }, { "ph": "f", "id": 150, "pid": 1336759, "tid": 1381173, "ts": 1295650789714.785, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789716.582, "dur": 3.561, "args": { "External id": 18837,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789717.742, "dur": 2.294, "args": { "External id": 18838,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1429 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789725.511, "dur": 8.688, "args": { "External id": 18839,"Record function id": 0, "Sequence number": 246617, "Fwd thread id": 1, "Ev Idx": 1430 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789726.317, "dur": 6.112, "args": { "External id": 18840,"Sequence number": 246617, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1431 } }, { "ph": "f", "id": 151, "pid": 1336759, "tid": 1381173, "ts": 1295650789726.317, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650789727.248, "dur": 4.985, "args": { "External id": 18841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650789727.992, "dur": 3.727, "args": { "External id": 18842,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789731.121, "dur": 0.454, "args": { "External id": 18843,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1434 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789738.122, "dur": 5.252, "args": { "External id": 18844,"Record function id": 0, "Ev Idx": 1435 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650789739.960, "dur": 2.952, "args": { "External id": 18845,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789741.117, "dur": 1.549, "args": { "External id": 18846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1437 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650789741.480, "dur": 1.114, "args": { "External id": 18847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1438 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789746.445, "dur": 5.917, "args": { "External id": 18848,"Record function id": 0, "Sequence number": 246616, "Fwd thread id": 1, "Ev Idx": 1439 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650789747.196, "dur": 3.624, "args": { "External id": 18849,"Sequence number": 246616, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1440 } }, { "ph": "f", "id": 152, "pid": 1336759, "tid": 1381173, "ts": 1295650789747.196, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650789748.254, "dur": 2.410, "args": { "External id": 18850,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650789749.289, "dur": 1.232, "args": { "External id": 18851,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1442 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650789756.594, "dur": 312.518, "args": { "External id": 18852,"Record function id": 0, "Sequence number": 246615, "Fwd thread id": 1, "Ev Idx": 1443 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650789758.299, "dur": 294.639, "args": { "External id": 18853,"Sequence number": 246615, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1444 } }, { "ph": "f", "id": 153, "pid": 1336759, "tid": 1381173, "ts": 1295650789758.299, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650789770.852, "dur": 6.603, "args": { "External id": 18854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789773.639, "dur": 3.373, "args": { "External id": 18855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650789779.490, "dur": 3.804, "args": { "External id": 18856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789781.247, "dur": 1.863, "args": { "External id": 18857,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650789784.542, "dur": 3.428, "args": { "External id": 18858,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650789786.174, "dur": 1.575, "args": { "External id": 18859,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1450 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650789812.174, "dur": 168.264, "args": { "External id": 18860,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650789890.839, "dur": 4.221, "args": { "External id": 18861,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650789896.944, "dur": 3.909, "args": { "External id": 18862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650790039.337, "dur": 4.213, "args": { "External id": 18863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650790047.079, "dur": 0.724, "args": { "External id": 18864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1381173, "ts": 1295650790049.827, "dur": 0.478, "args": { "External id": 18865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1456 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650790079.050, "dur": 260.365, "args": { "External id": 18866,"Record function id": 0, "Sequence number": 246614, "Fwd thread id": 1, "Ev Idx": 1457 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650790081.322, "dur": 250.254, "args": { "External id": 18867,"Sequence number": 246614, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1458 } }, { "ph": "f", "id": 154, "pid": 1336759, "tid": 1381173, "ts": 1295650790081.322, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650790101.839, "dur": 53.239, "args": { "External id": 18868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790105.144, "dur": 3.917, "args": { "External id": 18869,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650790110.733, "dur": 43.785, "args": { "External id": 18870,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650790164.187, "dur": 4.755, "args": { "External id": 18871,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790166.426, "dur": 2.181, "args": { "External id": 18872,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1463 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650790349.246, "dur": 160.220, "args": { "External id": 18873,"Record function id": 0, "Sequence number": 246613, "Fwd thread id": 1, "Ev Idx": 1464 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650790351.657, "dur": 151.530, "args": { "External id": 18874,"Sequence number": 246613, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1465 } }, { "ph": "f", "id": 155, "pid": 1336759, "tid": 1381173, "ts": 1295650790351.657, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1381173, "ts": 1295650790364.550, "dur": 35.221, "args": { "External id": 18875,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790367.661, "dur": 3.109, "args": { "External id": 18876,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650790371.952, "dur": 27.196, "args": { "External id": 18877,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1381173, "ts": 1295650790407.828, "dur": 5.061, "args": { "External id": 18878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790410.029, "dur": 2.548, "args": { "External id": 18879,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790515.564, "dur": 15.662, "args": { "External id": 18880,"Record function id": 0, "Sequence number": 246612, "Fwd thread id": 1, "Ev Idx": 1471 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790517.246, "dur": 11.646, "args": { "External id": 18881,"Sequence number": 246612, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1472 } }, { "ph": "f", "id": 156, "pid": 1336759, "tid": 1381173, "ts": 1295650790517.246, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790520.054, "dur": 8.517, "args": { "External id": 18882,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790522.021, "dur": 6.357, "args": { "External id": 18883,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790534.612, "dur": 6.125, "args": { "External id": 18884,"Record function id": 0, "Sequence number": 246611, "Fwd thread id": 1, "Ev Idx": 1475 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790535.387, "dur": 3.713, "args": { "External id": 18885,"Sequence number": 246611, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1476 } }, { "ph": "f", "id": 157, "pid": 1336759, "tid": 1381173, "ts": 1295650790535.387, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790536.804, "dur": 2.150, "args": { "External id": 18886,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790537.881, "dur": 0.934, "args": { "External id": 18887,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790543.766, "dur": 8.213, "args": { "External id": 18888,"Record function id": 0, "Sequence number": 246610, "Fwd thread id": 1, "Ev Idx": 1479 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790545.108, "dur": 5.307, "args": { "External id": 18889,"Sequence number": 246610, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1480 } }, { "ph": "f", "id": 158, "pid": 1336759, "tid": 1381173, "ts": 1295650790545.108, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790548.188, "dur": 2.088, "args": { "External id": 18890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790549.275, "dur": 0.875, "args": { "External id": 18891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790555.248, "dur": 5.947, "args": { "External id": 18892,"Record function id": 0, "Sequence number": 246609, "Fwd thread id": 1, "Ev Idx": 1483 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790556.984, "dur": 2.587, "args": { "External id": 18893,"Sequence number": 246609, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1484 } }, { "ph": "f", "id": 159, "pid": 1336759, "tid": 1381173, "ts": 1295650790556.984, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790557.872, "dur": 1.558, "args": { "External id": 18894,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790558.568, "dur": 0.761, "args": { "External id": 18895,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790564.502, "dur": 143.986, "args": { "External id": 18896,"Record function id": 0, "Sequence number": 246608, "Fwd thread id": 1, "Ev Idx": 1487 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790565.344, "dur": 136.202, "args": { "External id": 18897,"Sequence number": 246608, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1488 } }, { "ph": "f", "id": 160, "pid": 1336759, "tid": 1381173, "ts": 1295650790565.344, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790568.193, "dur": 9.235, "args": { "External id": 18898,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790572.394, "dur": 4.399, "args": { "External id": 18899,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790574.868, "dur": 1.689, "args": { "External id": 18900,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650790579.135, "dur": 64.781, "args": { "External id": 18901,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790645.022, "dur": 5.144, "args": { "External id": 18902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790645.845, "dur": 3.513, "args": { "External id": 18903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790647.660, "dur": 1.522, "args": { "External id": 18904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790651.622, "dur": 6.150, "args": { "External id": 18905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790654.776, "dur": 2.563, "args": { "External id": 18906,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790656.870, "dur": 0.387, "args": { "External id": 18907,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650790658.579, "dur": 41.960, "args": { "External id": 18908,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1499 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790713.319, "dur": 7.267, "args": { "External id": 18909,"Record function id": 0, "Sequence number": 246607, "Fwd thread id": 1, "Ev Idx": 1500 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790714.189, "dur": 4.349, "args": { "External id": 18910,"Sequence number": 246607, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1501 } }, { "ph": "f", "id": 161, "pid": 1336759, "tid": 1381173, "ts": 1295650790714.189, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790715.939, "dur": 2.438, "args": { "External id": 18911,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790716.927, "dur": 1.320, "args": { "External id": 18912,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1503 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790723.803, "dur": 9.099, "args": { "External id": 18913,"Record function id": 0, "Sequence number": 246606, "Fwd thread id": 1, "Ev Idx": 1504 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790724.640, "dur": 6.476, "args": { "External id": 18914,"Sequence number": 246606, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1505 } }, { "ph": "f", "id": 162, "pid": 1336759, "tid": 1381173, "ts": 1295650790724.640, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790727.256, "dur": 3.677, "args": { "External id": 18915,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790728.330, "dur": 2.112, "args": { "External id": 18916,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790729.997, "dur": 0.322, "args": { "External id": 18917,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1508 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650790738.685, "dur": 8.906, "args": { "External id": 18918,"Record function id": 0, "Ev Idx": 1509 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650790740.530, "dur": 6.220, "args": { "External id": 18919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650790742.831, "dur": 3.545, "args": { "External id": 18920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1511 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650790743.936, "dur": 2.341, "args": { "External id": 18921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1512 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790751.097, "dur": 8.312, "args": { "External id": 18922,"Record function id": 0, "Sequence number": 246605, "Fwd thread id": 1, "Ev Idx": 1513 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790752.463, "dur": 4.704, "args": { "External id": 18923,"Sequence number": 246605, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1514 } }, { "ph": "f", "id": 163, "pid": 1336759, "tid": 1381173, "ts": 1295650790752.463, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790753.385, "dur": 3.650, "args": { "External id": 18924,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790756.206, "dur": 0.690, "args": { "External id": 18925,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1516 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790762.527, "dur": 84.337, "args": { "External id": 18926,"Record function id": 0, "Sequence number": 246604, "Fwd thread id": 1, "Ev Idx": 1517 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790763.394, "dur": 78.857, "args": { "External id": 18927,"Sequence number": 246604, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1518 } }, { "ph": "f", "id": 164, "pid": 1336759, "tid": 1381173, "ts": 1295650790763.394, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790765.024, "dur": 3.143, "args": { "External id": 18928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790765.743, "dur": 1.999, "args": { "External id": 18929,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790767.283, "dur": 0.350, "args": { "External id": 18930,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650790768.790, "dur": 25.491, "args": { "External id": 18931,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790797.841, "dur": 4.175, "args": { "External id": 18932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790798.349, "dur": 3.170, "args": { "External id": 18933,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790799.955, "dur": 1.425, "args": { "External id": 18934,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790802.970, "dur": 3.990, "args": { "External id": 18935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790803.830, "dur": 2.643, "args": { "External id": 18936,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790805.129, "dur": 1.279, "args": { "External id": 18937,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650790809.498, "dur": 32.116, "args": { "External id": 18938,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790852.993, "dur": 33.216, "args": { "External id": 18939,"Record function id": 0, "Sequence number": 246603, "Fwd thread id": 1, "Ev Idx": 1530 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790853.883, "dur": 7.410, "args": { "External id": 18940,"Sequence number": 246603, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1531 } }, { "ph": "f", "id": 165, "pid": 1336759, "tid": 1381173, "ts": 1295650790853.883, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790855.502, "dur": 5.639, "args": { "External id": 18941,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790859.697, "dur": 1.345, "args": { "External id": 18942,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1381173, "ts": 1295650790864.453, "dur": 19.583, "args": { "External id": 18943,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1534 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790889.606, "dur": 32.069, "args": { "External id": 18944,"Record function id": 0, "Sequence number": 246602, "Fwd thread id": 1, "Ev Idx": 1535 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790912.754, "dur": 6.856, "args": { "External id": 18945,"Sequence number": 246602, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1536 } }, { "ph": "f", "id": 166, "pid": 1336759, "tid": 1381173, "ts": 1295650790912.754, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790915.493, "dur": 3.923, "args": { "External id": 18946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790916.214, "dur": 2.639, "args": { "External id": 18947,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790918.411, "dur": 0.346, "args": { "External id": 18948,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1539 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650790925.801, "dur": 4.759, "args": { "External id": 18949,"Record function id": 0, "Ev Idx": 1540 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650790927.393, "dur": 2.690, "args": { "External id": 18950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650790928.297, "dur": 1.480, "args": { "External id": 18951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1542 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650790928.695, "dur": 0.943, "args": { "External id": 18952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1543 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790933.949, "dur": 11.228, "args": { "External id": 18953,"Record function id": 0, "Sequence number": 246601, "Fwd thread id": 1, "Ev Idx": 1544 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790938.626, "dur": 4.695, "args": { "External id": 18954,"Sequence number": 246601, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1545 } }, { "ph": "f", "id": 167, "pid": 1336759, "tid": 1381173, "ts": 1295650790938.626, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650790939.548, "dur": 3.635, "args": { "External id": 18955,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650790942.350, "dur": 0.728, "args": { "External id": 18956,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1547 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790948.298, "dur": 134.312, "args": { "External id": 18957,"Record function id": 0, "Sequence number": 246600, "Fwd thread id": 1, "Ev Idx": 1548 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650790948.972, "dur": 124.999, "args": { "External id": 18958,"Sequence number": 246600, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1549 } }, { "ph": "f", "id": 168, "pid": 1336759, "tid": 1381173, "ts": 1295650790948.972, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790950.687, "dur": 2.861, "args": { "External id": 18959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790951.094, "dur": 1.996, "args": { "External id": 18960,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650790952.478, "dur": 0.489, "args": { "External id": 18961,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650790954.048, "dur": 26.018, "args": { "External id": 18962,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650790982.836, "dur": 44.538, "args": { "External id": 18963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650790983.403, "dur": 43.107, "args": { "External id": 18964,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791025.150, "dur": 0.879, "args": { "External id": 18965,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650791028.662, "dur": 3.368, "args": { "External id": 18966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650791029.716, "dur": 1.893, "args": { "External id": 18967,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791031.282, "dur": 0.241, "args": { "External id": 18968,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650791034.640, "dur": 38.622, "args": { "External id": 18969,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650791088.873, "dur": 25.543, "args": { "External id": 18970,"Record function id": 0, "Sequence number": 246599, "Fwd thread id": 1, "Ev Idx": 1561 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650791089.870, "dur": 3.930, "args": { "External id": 18971,"Sequence number": 246599, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1562 } }, { "ph": "f", "id": 169, "pid": 1336759, "tid": 1381173, "ts": 1295650791089.870, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650791091.437, "dur": 2.210, "args": { "External id": 18972,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650791092.384, "dur": 1.166, "args": { "External id": 18973,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650791096.597, "dur": 15.882, "args": { "External id": 18974,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1565 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650791117.787, "dur": 8.356, "args": { "External id": 18975,"Record function id": 0, "Sequence number": 246598, "Fwd thread id": 1, "Ev Idx": 1566 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336759, "tid": 1381173, "ts": 1295650791118.865, "dur": 5.757, "args": { "External id": 18976,"Sequence number": 246598, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1567 } }, { "ph": "f", "id": 170, "pid": 1336759, "tid": 1381173, "ts": 1295650791118.865, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1381173, "ts": 1295650791119.431, "dur": 4.989, "args": { "External id": 18977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1381173, "ts": 1295650791120.159, "dur": 3.748, "args": { "External id": 18978,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791123.300, "dur": 0.495, "args": { "External id": 18979,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1570 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650791130.146, "dur": 5.141, "args": { "External id": 18980,"Record function id": 0, "Ev Idx": 1571 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650791131.735, "dur": 3.080, "args": { "External id": 18981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650791132.968, "dur": 1.564, "args": { "External id": 18982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1573 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650791133.359, "dur": 1.056, "args": { "External id": 18983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1574 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650791139.023, "dur": 372.434, "args": { "External id": 18984,"Record function id": 0, "Sequence number": 246597, "Fwd thread id": 1, "Ev Idx": 1575 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650791140.693, "dur": 338.425, "args": { "External id": 18985,"Sequence number": 246597, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1576 } }, { "ph": "f", "id": 171, "pid": 1336759, "tid": 1381173, "ts": 1295650791140.693, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650791173.755, "dur": 2.075, "args": { "External id": 18986,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650791174.651, "dur": 1.016, "args": { "External id": 18987,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650791192.145, "dur": 4.936, "args": { "External id": 18988,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650791206.754, "dur": 1.708, "args": { "External id": 18989,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650791376.839, "dur": 3.282, "args": { "External id": 18990,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1381173, "ts": 1295650791384.607, "dur": 35.668, "args": { "External id": 18991,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791395.453, "dur": 0.971, "args": { "External id": 18992,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650791425.754, "dur": 31.518, "args": { "External id": 18993,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650791427.671, "dur": 29.396, "args": { "External id": 18994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791432.653, "dur": 4.491, "args": { "External id": 18995,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650791440.640, "dur": 15.950, "args": { "External id": 18996,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1381173, "ts": 1295650791461.653, "dur": 2.857, "args": { "External id": 18997,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650791462.997, "dur": 1.356, "args": { "External id": 18998,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1381173, "ts": 1295650791470.593, "dur": 2.185, "args": { "External id": 18999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650791471.859, "dur": 0.830, "args": { "External id": 19000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1381173, "ts": 1295650791492.376, "dur": 14.816, "args": { "External id": 19001,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650791522.653, "dur": 10.859, "args": { "External id": 19002,"Record function id": 0, "Ev Idx": 1593 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650791524.934, "dur": 7.708, "args": { "External id": 19003,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650791526.793, "dur": 4.886, "args": { "External id": 19004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1595 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650791529.970, "dur": 1.616, "args": { "External id": 19005,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1596 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650791537.823, "dur": 2539.377, "args": { "External id": 19006,"Record function id": 0, "Ev Idx": 1597 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.27)", "pid": 1336759, "tid": 1381173, "ts": 1295650791567.209, "dur": 866.165, "args": { "External id": 19007,"Record function id": 0, "Ev Idx": 1598 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.26", "pid": 1336759, "tid": 1381173, "ts": 1295650791590.289, "dur": 834.745, "args": { "External id": 19008,"Record function id": 0, "Ev Idx": 1599 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650791602.866, "dur": 806.543, "args": { "External id": 19009,"Record function id": 0, "Ev Idx": 1600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650791672.704, "dur": 5.339, "args": { "External id": 19010,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295650791693.451, "dur": 27.401, "args": { "External id": 19011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791697.551, "dur": 1.194, "args": { "External id": 19012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791700.710, "dur": 1.654, "args": { "External id": 19013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791704.553, "dur": 0.388, "args": { "External id": 19014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791706.240, "dur": 0.550, "args": { "External id": 19015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791708.062, "dur": 0.345, "args": { "External id": 19016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791710.232, "dur": 0.172, "args": { "External id": 19017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791711.668, "dur": 0.590, "args": { "External id": 19018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791714.073, "dur": 0.436, "args": { "External id": 19019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791716.240, "dur": 0.391, "args": { "External id": 19020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650791734.368, "dur": 30.578, "args": { "External id": 19021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1612 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295650791800.241, "dur": 105.921, "args": { "External id": 19022,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650791811.363, "dur": 4.779, "args": { "External id": 19023,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295650791821.862, "dur": 10.355, "args": { "External id": 19024,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650791825.759, "dur": 6.057, "args": { "External id": 19025,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791829.965, "dur": 0.577, "args": { "External id": 19026,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295650791839.106, "dur": 25.736, "args": { "External id": 19027,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791841.370, "dur": 0.620, "args": { "External id": 19028,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791844.288, "dur": 0.460, "args": { "External id": 19029,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791846.495, "dur": 0.686, "args": { "External id": 19030,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791849.006, "dur": 0.322, "args": { "External id": 19031,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791850.970, "dur": 0.458, "args": { "External id": 19032,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791853.123, "dur": 0.384, "args": { "External id": 19033,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791855.159, "dur": 1.208, "args": { "External id": 19034,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791857.941, "dur": 0.498, "args": { "External id": 19035,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650791860.240, "dur": 0.446, "args": { "External id": 19036,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650791875.035, "dur": 23.108, "args": { "External id": 19037,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1628 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295650791959.651, "dur": 345.322, "args": { "External id": 19038,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1629 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650792027.509, "dur": 271.137, "args": { "External id": 19039,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1630, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295650792040.777, "dur": 252.359, "args": { "External id": 19040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1631 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650792328.552, "dur": 2.279, "args": { "External id": 19041,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1632, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650792441.558, "dur": 1616.061, "args": { "External id": 19042,"Sequence number": 246596, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1633 } }, { "ph": "f", "id": 172, "pid": 1336759, "tid": 1381173, "ts": 1295650792441.558, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650792557.646, "dur": 111.534, "args": { "External id": 19043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1634 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295650792711.719, "dur": 37.097, "args": { "External id": 19044,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650792767.543, "dur": 47.096, "args": { "External id": 19045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650792823.420, "dur": 31.969, "args": { "External id": 19046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650792861.811, "dur": 46.504, "args": { "External id": 19047,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650792915.839, "dur": 28.467, "args": { "External id": 19048,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650792951.952, "dur": 85.803, "args": { "External id": 19049,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295650793066.860, "dur": 23.688, "args": { "External id": 19050,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1641 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295650793109.278, "dur": 28.298, "args": { "External id": 19051,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1642 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295650793159.775, "dur": 19.383, "args": { "External id": 19052,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1643 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295650793194.565, "dur": 14.740, "args": { "External id": 19053,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793220.247, "dur": 52.694, "args": { "External id": 19054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793278.270, "dur": 35.691, "args": { "External id": 19055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1646 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650793343.612, "dur": 176.101, "args": { "External id": 19056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650793427.922, "dur": 5.526, "args": { "External id": 19057,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650793435.971, "dur": 3.071, "args": { "External id": 19058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1649 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295650793551.426, "dur": 25.204, "args": { "External id": 19059,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1650 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295650793588.858, "dur": 14.499, "args": { "External id": 19060,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793612.057, "dur": 35.572, "args": { "External id": 19061,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793654.859, "dur": 34.158, "args": { "External id": 19062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793696.221, "dur": 21.375, "args": { "External id": 19063,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793724.179, "dur": 30.049, "args": { "External id": 19064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793760.549, "dur": 20.190, "args": { "External id": 19065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650793788.130, "dur": 30.566, "args": { "External id": 19066,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1657 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295650793835.640, "dur": 21.619, "args": { "External id": 19067,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1658 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295650793873.507, "dur": 23.061, "args": { "External id": 19068,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1659 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295650793912.339, "dur": 16.444, "args": { "External id": 19069,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1660 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295650793942.461, "dur": 14.071, "args": { "External id": 19070,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1661 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295650793970.599, "dur": 55.217, "args": { "External id": 19071,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794100.956, "dur": 15.595, "args": { "External id": 19072,"Record function id": 0, "Ev Idx": 1663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794104.640, "dur": 10.927, "args": { "External id": 19073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794108.814, "dur": 5.752, "args": { "External id": 19074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794110.418, "dur": 3.999, "args": { "External id": 19075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794120.609, "dur": 6.000, "args": { "External id": 19076,"Record function id": 0, "Ev Idx": 1667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794122.535, "dur": 3.614, "args": { "External id": 19077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794123.362, "dur": 2.262, "args": { "External id": 19078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794124.515, "dur": 0.998, "args": { "External id": 19079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794130.054, "dur": 5.246, "args": { "External id": 19080,"Record function id": 0, "Ev Idx": 1671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794132.176, "dur": 2.699, "args": { "External id": 19081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794132.650, "dur": 1.687, "args": { "External id": 19082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794133.249, "dur": 1.001, "args": { "External id": 19083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794138.633, "dur": 5.290, "args": { "External id": 19084,"Record function id": 0, "Ev Idx": 1675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794140.332, "dur": 3.183, "args": { "External id": 19085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794140.851, "dur": 2.238, "args": { "External id": 19086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794141.405, "dur": 1.595, "args": { "External id": 19087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794147.373, "dur": 3.889, "args": { "External id": 19088,"Record function id": 0, "Ev Idx": 1679 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794148.811, "dur": 2.007, "args": { "External id": 19089,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794149.366, "dur": 1.062, "args": { "External id": 19090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1681 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794149.729, "dur": 0.593, "args": { "External id": 19091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1682 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794154.684, "dur": 4.577, "args": { "External id": 19092,"Record function id": 0, "Ev Idx": 1683 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794156.373, "dur": 2.471, "args": { "External id": 19093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794157.031, "dur": 1.417, "args": { "External id": 19094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1685 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794157.800, "dur": 0.537, "args": { "External id": 19095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794162.696, "dur": 3.943, "args": { "External id": 19096,"Record function id": 0, "Ev Idx": 1687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794164.168, "dur": 2.049, "args": { "External id": 19097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794164.616, "dur": 1.161, "args": { "External id": 19098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794165.026, "dur": 0.647, "args": { "External id": 19099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794169.782, "dur": 4.119, "args": { "External id": 19100,"Record function id": 0, "Ev Idx": 1691 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794171.703, "dur": 1.790, "args": { "External id": 19101,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794172.167, "dur": 0.916, "args": { "External id": 19102,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1693 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794172.563, "dur": 0.454, "args": { "External id": 19103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794177.161, "dur": 4.056, "args": { "External id": 19104,"Record function id": 0, "Ev Idx": 1695 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650794178.529, "dur": 2.270, "args": { "External id": 19105,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794179.069, "dur": 1.212, "args": { "External id": 19106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1697 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650794179.640, "dur": 0.548, "args": { "External id": 19107,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1698 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650794185.913, "dur": 167397.406, "args": { "External id": 19108,"Record function id": 0, "Sequence number": 246595, "Fwd thread id": 1, "Ev Idx": 1699 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650794187.522, "dur": 167387.216, "args": { "External id": 19109,"Sequence number": 246595, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1700 } }, { "ph": "f", "id": 173, "pid": 1336759, "tid": 1381173, "ts": 1295650794187.522, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.27)", "pid": 1336759, "tid": 1381173, "ts": 1295650794216.437, "dur": 56.843, "args": { "External id": 19110,"Record function id": 0, "Ev Idx": 1701 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.27)", "pid": 1336759, "tid": 1381173, "ts": 1295650794282.551, "dur": 63.829, "args": { "External id": 19111,"Record function id": 0, "Ev Idx": 1702 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.27)", "pid": 1336759, "tid": 1381173, "ts": 1295650794352.891, "dur": 167212.558, "args": { "External id": 19112,"Record function id": 0, "Ev Idx": 1703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650794407.090, "dur": 7.933, "args": { "External id": 19113,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650794425.074, "dur": 5.004, "args": { "External id": 19114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1705 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295650794445.706, "dur": 166247.911, "args": { "External id": 19115,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295650794460.397, "dur": 166220.382, "args": { "External id": 19116,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650794534.749, "dur": 4.775, "args": { "External id": 19117,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650794546.212, "dur": 166083.220, "args": { "External id": 19118,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650794548.877, "dur": 166079.420, "args": { "External id": 19119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650794553.500, "dur": 4.958, "args": { "External id": 19120,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650794560.658, "dur": 166062.577, "args": { "External id": 19121,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295650960804.798, "dur": 12.675, "args": { "External id": 19122,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650960809.056, "dur": 7.995, "args": { "External id": 19123,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295650960852.760, "dur": 394.732, "args": { "External id": 19124,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650960881.407, "dur": 360.113, "args": { "External id": 19125,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1716, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295650960893.842, "dur": 327.942, "args": { "External id": 19126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650961269.815, "dur": 2.711, "args": { "External id": 19127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1718, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961336.571, "dur": 7.421, "args": { "External id": 19128,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961394.695, "dur": 1.358, "args": { "External id": 19129,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961414.724, "dur": 0.941, "args": { "External id": 19130,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961430.497, "dur": 1.039, "args": { "External id": 19131,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961444.133, "dur": 0.927, "args": { "External id": 19132,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961457.440, "dur": 1.306, "args": { "External id": 19133,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961471.491, "dur": 0.928, "args": { "External id": 19134,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961485.763, "dur": 2.365, "args": { "External id": 19135,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961499.721, "dur": 0.713, "args": { "External id": 19136,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1727 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650961599.744, "dur": 2760.582, "args": { "External id": 19137,"Record function id": 0, "Ev Idx": 1728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650961618.913, "dur": 1062.738, "args": { "External id": 19138,"Record function id": 0, "Ev Idx": 1729 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650961635.613, "dur": 320.617, "args": { "External id": 19139,"Record function id": 0, "Ev Idx": 1730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961709.772, "dur": 4.630, "args": { "External id": 19140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961717.863, "dur": 0.988, "args": { "External id": 19141,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961720.664, "dur": 0.740, "args": { "External id": 19142,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961723.414, "dur": 1.501, "args": { "External id": 19143,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961726.428, "dur": 1.210, "args": { "External id": 19144,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961729.284, "dur": 0.769, "args": { "External id": 19145,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961731.621, "dur": 1.895, "args": { "External id": 19146,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961735.106, "dur": 0.974, "args": { "External id": 19147,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961737.643, "dur": 0.905, "args": { "External id": 19148,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650961740.059, "dur": 0.701, "args": { "External id": 19149,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1740 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650961758.606, "dur": 161.903, "args": { "External id": 19150,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650961774.776, "dur": 141.217, "args": { "External id": 19151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650961798.613, "dur": 12.437, "args": { "External id": 19152,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650961814.433, "dur": 71.675, "args": { "External id": 19153,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650961817.072, "dur": 68.666, "args": { "External id": 19154,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650961821.510, "dur": 7.889, "args": { "External id": 19155,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650961831.162, "dur": 53.596, "args": { "External id": 19156,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1747 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.25", "pid": 1336759, "tid": 1381173, "ts": 1295650962083.848, "dur": 588.583, "args": { "External id": 19157,"Record function id": 0, "Ev Idx": 1748 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295650962103.089, "dur": 555.464, "args": { "External id": 19158,"Record function id": 0, "Ev Idx": 1749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650962161.686, "dur": 6.416, "args": { "External id": 19159,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295650962184.628, "dur": 32.165, "args": { "External id": 19160,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962190.585, "dur": 1.733, "args": { "External id": 19161,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962194.716, "dur": 0.383, "args": { "External id": 19162,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962196.945, "dur": 0.602, "args": { "External id": 19163,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962199.291, "dur": 0.549, "args": { "External id": 19164,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962201.844, "dur": 0.399, "args": { "External id": 19165,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962204.281, "dur": 0.655, "args": { "External id": 19166,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962206.872, "dur": 1.324, "args": { "External id": 19167,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962209.831, "dur": 0.472, "args": { "External id": 19168,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962211.886, "dur": 0.309, "args": { "External id": 19169,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650962246.503, "dur": 37.034, "args": { "External id": 19170,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1761 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295650962320.610, "dur": 107.895, "args": { "External id": 19171,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650962332.000, "dur": 4.459, "args": { "External id": 19172,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295650962342.018, "dur": 11.362, "args": { "External id": 19173,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295650962346.669, "dur": 6.280, "args": { "External id": 19174,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962350.437, "dur": 0.881, "args": { "External id": 19175,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295650962361.209, "dur": 25.846, "args": { "External id": 19176,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962363.786, "dur": 0.371, "args": { "External id": 19177,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962366.054, "dur": 0.479, "args": { "External id": 19178,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962368.293, "dur": 0.689, "args": { "External id": 19179,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962370.788, "dur": 1.345, "args": { "External id": 19180,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962374.119, "dur": 0.585, "args": { "External id": 19181,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962376.467, "dur": 0.417, "args": { "External id": 19182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962378.783, "dur": 0.330, "args": { "External id": 19183,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962380.583, "dur": 0.387, "args": { "External id": 19184,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650962383.186, "dur": 0.419, "args": { "External id": 19185,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650962400.061, "dur": 20.164, "args": { "External id": 19186,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1777 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295650962478.024, "dur": 114.252, "args": { "External id": 19187,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1778 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650962500.342, "dur": 88.283, "args": { "External id": 19188,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1779, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295650962513.188, "dur": 71.403, "args": { "External id": 19189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1780 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295650962607.024, "dur": 1.885, "args": { "External id": 19190,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1781, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650962688.627, "dur": 1650.700, "args": { "External id": 19191,"Sequence number": 246594, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1782 } }, { "ph": "f", "id": 174, "pid": 1336759, "tid": 1381173, "ts": 1295650962688.627, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650962792.353, "dur": 103.302, "args": { "External id": 19192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1783 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295650962935.791, "dur": 36.661, "args": { "External id": 19193,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295650963031.644, "dur": 59.833, "args": { "External id": 19194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963103.164, "dur": 32.594, "args": { "External id": 19195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963144.331, "dur": 45.853, "args": { "External id": 19196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963198.365, "dur": 28.095, "args": { "External id": 19197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963252.102, "dur": 47.580, "args": { "External id": 19198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295650963325.647, "dur": 23.059, "args": { "External id": 19199,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1790 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295650963369.014, "dur": 27.232, "args": { "External id": 19200,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1791 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295650963417.205, "dur": 19.070, "args": { "External id": 19201,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1792 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295650963450.195, "dur": 13.502, "args": { "External id": 19202,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963472.309, "dur": 28.820, "args": { "External id": 19203,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963504.617, "dur": 32.321, "args": { "External id": 19204,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1795 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295650963565.089, "dur": 166.011, "args": { "External id": 19205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650963642.666, "dur": 5.504, "args": { "External id": 19206,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650963650.641, "dur": 2.272, "args": { "External id": 19207,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1798 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295650963773.900, "dur": 23.972, "args": { "External id": 19208,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1799 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295650963813.382, "dur": 14.126, "args": { "External id": 19209,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963835.930, "dur": 32.865, "args": { "External id": 19210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963875.330, "dur": 33.887, "args": { "External id": 19211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963918.243, "dur": 20.898, "args": { "External id": 19212,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963945.388, "dur": 29.899, "args": { "External id": 19213,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650963980.981, "dur": 61.707, "args": { "External id": 19214,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295650964053.962, "dur": 49.276, "args": { "External id": 19215,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1806 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295650964127.709, "dur": 22.966, "args": { "External id": 19216,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1807 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295650964167.229, "dur": 23.739, "args": { "External id": 19217,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1808 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295650964204.355, "dur": 19.324, "args": { "External id": 19218,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1809 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295650964257.137, "dur": 16.019, "args": { "External id": 19219,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1810 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295650964293.268, "dur": 15.363, "args": { "External id": 19220,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964383.907, "dur": 16.052, "args": { "External id": 19221,"Record function id": 0, "Ev Idx": 1812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964387.351, "dur": 11.728, "args": { "External id": 19222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964392.044, "dur": 6.072, "args": { "External id": 19223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964393.814, "dur": 4.201, "args": { "External id": 19224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964403.894, "dur": 5.519, "args": { "External id": 19225,"Record function id": 0, "Ev Idx": 1816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964405.372, "dur": 3.630, "args": { "External id": 19226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964406.384, "dur": 2.169, "args": { "External id": 19227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964407.280, "dur": 1.175, "args": { "External id": 19228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964412.808, "dur": 4.355, "args": { "External id": 19229,"Record function id": 0, "Ev Idx": 1820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964414.015, "dur": 2.754, "args": { "External id": 19230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964414.791, "dur": 1.543, "args": { "External id": 19231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964415.202, "dur": 1.040, "args": { "External id": 19232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964420.308, "dur": 5.069, "args": { "External id": 19233,"Record function id": 0, "Ev Idx": 1824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964421.600, "dur": 3.387, "args": { "External id": 19234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964422.229, "dur": 2.346, "args": { "External id": 19235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964422.789, "dur": 1.719, "args": { "External id": 19236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964428.454, "dur": 3.587, "args": { "External id": 19237,"Record function id": 0, "Ev Idx": 1828 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964429.754, "dur": 1.899, "args": { "External id": 19238,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964430.325, "dur": 0.917, "args": { "External id": 19239,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1830 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964430.574, "dur": 0.607, "args": { "External id": 19240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1831 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964435.173, "dur": 3.527, "args": { "External id": 19241,"Record function id": 0, "Ev Idx": 1832 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964436.200, "dur": 2.111, "args": { "External id": 19242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964436.673, "dur": 1.222, "args": { "External id": 19243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1834 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964437.240, "dur": 0.554, "args": { "External id": 19244,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1835 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964441.900, "dur": 4.062, "args": { "External id": 19245,"Record function id": 0, "Ev Idx": 1836 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964443.054, "dur": 2.517, "args": { "External id": 19246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964443.933, "dur": 1.188, "args": { "External id": 19247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1838 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964444.380, "dur": 0.635, "args": { "External id": 19248,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1839 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964449.017, "dur": 3.550, "args": { "External id": 19249,"Record function id": 0, "Ev Idx": 1840 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964450.146, "dur": 2.025, "args": { "External id": 19250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964450.615, "dur": 1.124, "args": { "External id": 19251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1842 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964451.098, "dur": 0.564, "args": { "External id": 19252,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964455.744, "dur": 3.914, "args": { "External id": 19253,"Record function id": 0, "Ev Idx": 1844 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295650964457.122, "dur": 2.142, "args": { "External id": 19254,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964457.815, "dur": 1.017, "args": { "External id": 19255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1846 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295650964458.222, "dur": 0.520, "args": { "External id": 19256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650964463.679, "dur": 39070.679, "args": { "External id": 19257,"Record function id": 0, "Sequence number": 246593, "Fwd thread id": 1, "Ev Idx": 1848 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295650964464.878, "dur": 39060.844, "args": { "External id": 19258,"Sequence number": 246593, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1849 } }, { "ph": "f", "id": 175, "pid": 1336759, "tid": 1381173, "ts": 1295650964464.878, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650964493.539, "dur": 39.297, "args": { "External id": 19259,"Record function id": 0, "Ev Idx": 1850 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650964540.888, "dur": 59.355, "args": { "External id": 19260,"Record function id": 0, "Ev Idx": 1851 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.26)", "pid": 1336759, "tid": 1381173, "ts": 1295650964605.621, "dur": 38912.117, "args": { "External id": 19261,"Record function id": 0, "Ev Idx": 1852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650964693.862, "dur": 6.673, "args": { "External id": 19262,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295650964709.766, "dur": 4.742, "args": { "External id": 19263,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1854 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295650964729.817, "dur": 37846.128, "args": { "External id": 19264,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295650964743.101, "dur": 37823.178, "args": { "External id": 19265,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295650964791.283, "dur": 14.680, "args": { "External id": 19266,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295650964812.811, "dur": 37714.727, "args": { "External id": 19267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295650964815.585, "dur": 37711.197, "args": { "External id": 19268,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295650964819.981, "dur": 4.822, "args": { "External id": 19269,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295650964826.742, "dur": 37696.311, "args": { "External id": 19270,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651002670.209, "dur": 9.443, "args": { "External id": 19271,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651002673.662, "dur": 5.625, "args": { "External id": 19272,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651002709.574, "dur": 469.943, "args": { "External id": 19273,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651002737.002, "dur": 435.498, "args": { "External id": 19274,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1865, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651002748.902, "dur": 416.491, "args": { "External id": 19275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651003205.638, "dur": 2.169, "args": { "External id": 19276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1867, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003296.880, "dur": 7.947, "args": { "External id": 19277,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003352.711, "dur": 1.460, "args": { "External id": 19278,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003371.082, "dur": 1.069, "args": { "External id": 19279,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003386.457, "dur": 1.274, "args": { "External id": 19280,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003399.818, "dur": 0.744, "args": { "External id": 19281,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003412.123, "dur": 1.011, "args": { "External id": 19282,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003425.010, "dur": 1.172, "args": { "External id": 19283,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003438.970, "dur": 2.313, "args": { "External id": 19284,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003452.423, "dur": 0.989, "args": { "External id": 19285,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1876 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651003550.521, "dur": 2746.954, "args": { "External id": 19286,"Record function id": 0, "Ev Idx": 1877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295651003569.449, "dur": 1050.400, "args": { "External id": 19287,"Record function id": 0, "Ev Idx": 1878 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295651003588.014, "dur": 315.244, "args": { "External id": 19288,"Record function id": 0, "Ev Idx": 1879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003662.403, "dur": 4.179, "args": { "External id": 19289,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003669.915, "dur": 1.205, "args": { "External id": 19290,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003673.086, "dur": 1.014, "args": { "External id": 19291,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003675.935, "dur": 1.594, "args": { "External id": 19292,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003679.237, "dur": 0.909, "args": { "External id": 19293,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003681.829, "dur": 0.846, "args": { "External id": 19294,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003684.208, "dur": 2.043, "args": { "External id": 19295,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003687.585, "dur": 1.076, "args": { "External id": 19296,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003690.009, "dur": 0.631, "args": { "External id": 19297,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651003691.984, "dur": 0.938, "args": { "External id": 19298,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1889 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651003710.890, "dur": 160.110, "args": { "External id": 19299,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651003726.986, "dur": 139.179, "args": { "External id": 19300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651003751.825, "dur": 13.599, "args": { "External id": 19301,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651003768.736, "dur": 70.301, "args": { "External id": 19302,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651003771.678, "dur": 66.965, "args": { "External id": 19303,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651003775.970, "dur": 7.720, "args": { "External id": 19304,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651003785.561, "dur": 52.278, "args": { "External id": 19305,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1896 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.24", "pid": 1336759, "tid": 1381173, "ts": 1295651003980.257, "dur": 631.189, "args": { "External id": 19306,"Record function id": 0, "Ev Idx": 1897 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651004040.462, "dur": 557.132, "args": { "External id": 19307,"Record function id": 0, "Ev Idx": 1898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651004102.023, "dur": 7.085, "args": { "External id": 19308,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651004125.232, "dur": 31.562, "args": { "External id": 19309,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004130.917, "dur": 1.597, "args": { "External id": 19310,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004134.686, "dur": 0.335, "args": { "External id": 19311,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004136.580, "dur": 0.431, "args": { "External id": 19312,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004138.859, "dur": 0.424, "args": { "External id": 19313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004142.061, "dur": 0.346, "args": { "External id": 19314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004144.338, "dur": 0.557, "args": { "External id": 19315,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004146.483, "dur": 1.508, "args": { "External id": 19316,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004149.906, "dur": 0.433, "args": { "External id": 19317,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004151.894, "dur": 0.437, "args": { "External id": 19318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651004166.488, "dur": 33.160, "args": { "External id": 19319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1910 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651004250.820, "dur": 120.226, "args": { "External id": 19320,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651004262.398, "dur": 4.833, "args": { "External id": 19321,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651004272.581, "dur": 11.281, "args": { "External id": 19322,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651004276.965, "dur": 6.448, "args": { "External id": 19323,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004281.176, "dur": 0.728, "args": { "External id": 19324,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651004291.796, "dur": 37.559, "args": { "External id": 19325,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004294.416, "dur": 0.444, "args": { "External id": 19326,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004296.838, "dur": 0.704, "args": { "External id": 19327,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004310.800, "dur": 0.581, "args": { "External id": 19328,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004313.904, "dur": 0.993, "args": { "External id": 19329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004316.600, "dur": 0.410, "args": { "External id": 19330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004318.581, "dur": 0.309, "args": { "External id": 19331,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004320.606, "dur": 0.279, "args": { "External id": 19332,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004322.489, "dur": 0.466, "args": { "External id": 19333,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651004324.714, "dur": 0.340, "args": { "External id": 19334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651004340.511, "dur": 22.276, "args": { "External id": 19335,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1926 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651004419.665, "dur": 111.034, "args": { "External id": 19336,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1927 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651004442.261, "dur": 84.808, "args": { "External id": 19337,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1928, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651004452.494, "dur": 70.261, "args": { "External id": 19338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651004546.954, "dur": 1.749, "args": { "External id": 19339,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1930, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651004627.331, "dur": 1649.905, "args": { "External id": 19340,"Sequence number": 246592, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1931 } }, { "ph": "f", "id": 176, "pid": 1336759, "tid": 1381173, "ts": 1295651004627.331, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651004732.090, "dur": 101.927, "args": { "External id": 19341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1932 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651004871.395, "dur": 36.712, "args": { "External id": 19342,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651004925.339, "dur": 49.352, "args": { "External id": 19343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651004983.810, "dur": 79.588, "args": { "External id": 19344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005075.956, "dur": 46.137, "args": { "External id": 19345,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005130.052, "dur": 28.163, "args": { "External id": 19346,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005174.264, "dur": 43.006, "args": { "External id": 19347,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651005262.162, "dur": 25.453, "args": { "External id": 19348,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1939 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651005307.472, "dur": 26.830, "args": { "External id": 19349,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1940 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651005355.811, "dur": 19.678, "args": { "External id": 19350,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1941 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651005393.566, "dur": 14.383, "args": { "External id": 19351,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005417.393, "dur": 32.043, "args": { "External id": 19352,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005453.207, "dur": 34.425, "args": { "External id": 19353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1944 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651005515.040, "dur": 169.871, "args": { "External id": 19354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651005596.539, "dur": 6.445, "args": { "External id": 19355,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651005605.476, "dur": 2.223, "args": { "External id": 19356,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1947 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651005716.172, "dur": 24.879, "args": { "External id": 19357,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1948 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651005752.748, "dur": 14.483, "args": { "External id": 19358,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005776.276, "dur": 35.893, "args": { "External id": 19359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005819.088, "dur": 35.673, "args": { "External id": 19360,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005862.873, "dur": 20.532, "args": { "External id": 19361,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005888.931, "dur": 43.602, "args": { "External id": 19362,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005945.093, "dur": 23.975, "args": { "External id": 19363,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651005976.803, "dur": 71.832, "args": { "External id": 19364,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651006072.334, "dur": 27.489, "args": { "External id": 19365,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1956 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651006117.639, "dur": 23.418, "args": { "External id": 19366,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651006155.414, "dur": 16.810, "args": { "External id": 19367,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1958 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651006186.280, "dur": 14.714, "args": { "External id": 19368,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1959 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651006214.616, "dur": 29.560, "args": { "External id": 19369,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006320.193, "dur": 15.319, "args": { "External id": 19370,"Record function id": 0, "Ev Idx": 1961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006323.384, "dur": 11.152, "args": { "External id": 19371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006327.729, "dur": 5.978, "args": { "External id": 19372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006329.502, "dur": 4.053, "args": { "External id": 19373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006339.269, "dur": 5.597, "args": { "External id": 19374,"Record function id": 0, "Ev Idx": 1965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006340.729, "dur": 3.627, "args": { "External id": 19375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006341.545, "dur": 2.266, "args": { "External id": 19376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006342.718, "dur": 0.917, "args": { "External id": 19377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006348.073, "dur": 4.861, "args": { "External id": 19378,"Record function id": 0, "Ev Idx": 1969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006349.485, "dur": 3.031, "args": { "External id": 19379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006350.189, "dur": 1.866, "args": { "External id": 19380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006350.879, "dur": 1.096, "args": { "External id": 19381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006356.053, "dur": 5.351, "args": { "External id": 19382,"Record function id": 0, "Ev Idx": 1973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006357.369, "dur": 3.646, "args": { "External id": 19383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006357.831, "dur": 2.780, "args": { "External id": 19384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006358.564, "dur": 1.971, "args": { "External id": 19385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006364.459, "dur": 4.240, "args": { "External id": 19386,"Record function id": 0, "Ev Idx": 1977 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006365.735, "dur": 2.576, "args": { "External id": 19387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006366.191, "dur": 1.718, "args": { "External id": 19388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1979 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006366.805, "dur": 1.014, "args": { "External id": 19389,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1980 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006371.779, "dur": 3.822, "args": { "External id": 19390,"Record function id": 0, "Ev Idx": 1981 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006372.906, "dur": 2.306, "args": { "External id": 19391,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006373.512, "dur": 1.277, "args": { "External id": 19392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1983 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006374.197, "dur": 0.472, "args": { "External id": 19393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006378.987, "dur": 3.818, "args": { "External id": 19394,"Record function id": 0, "Ev Idx": 1985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006380.179, "dur": 2.237, "args": { "External id": 19395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006380.912, "dur": 1.081, "args": { "External id": 19396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006381.200, "dur": 0.690, "args": { "External id": 19397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006385.933, "dur": 3.730, "args": { "External id": 19398,"Record function id": 0, "Ev Idx": 1989 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006387.043, "dur": 2.231, "args": { "External id": 19399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006387.569, "dur": 1.232, "args": { "External id": 19400,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1991 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006388.134, "dur": 0.595, "args": { "External id": 19401,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006392.713, "dur": 3.789, "args": { "External id": 19402,"Record function id": 0, "Ev Idx": 1993 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651006394.017, "dur": 2.098, "args": { "External id": 19403,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006394.617, "dur": 1.083, "args": { "External id": 19404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1995 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651006395.154, "dur": 0.446, "args": { "External id": 19405,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1996 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651006399.924, "dur": 37427.403, "args": { "External id": 19406,"Record function id": 0, "Sequence number": 246591, "Fwd thread id": 1, "Ev Idx": 1997 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651006401.149, "dur": 37417.761, "args": { "External id": 19407,"Sequence number": 246591, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1998 } }, { "ph": "f", "id": 177, "pid": 1336759, "tid": 1381173, "ts": 1295651006401.149, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295651006431.152, "dur": 38.106, "args": { "External id": 19408,"Record function id": 0, "Ev Idx": 1999 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295651006477.058, "dur": 59.736, "args": { "External id": 19409,"Record function id": 0, "Ev Idx": 2000 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.25)", "pid": 1336759, "tid": 1381173, "ts": 1295651006542.816, "dur": 37268.677, "args": { "External id": 19410,"Record function id": 0, "Ev Idx": 2001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651006629.875, "dur": 6.926, "args": { "External id": 19411,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651006646.580, "dur": 4.991, "args": { "External id": 19412,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2003 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651006666.724, "dur": 36349.395, "args": { "External id": 19413,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651006680.260, "dur": 36325.772, "args": { "External id": 19414,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651006728.197, "dur": 14.511, "args": { "External id": 19415,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651006749.557, "dur": 36196.236, "args": { "External id": 19416,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651006752.370, "dur": 36192.639, "args": { "External id": 19417,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651006756.527, "dur": 4.605, "args": { "External id": 19418,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651006762.968, "dur": 36178.180, "args": { "External id": 19419,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651043108.529, "dur": 9.475, "args": { "External id": 19420,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651043112.053, "dur": 5.494, "args": { "External id": 19421,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651043147.786, "dur": 362.801, "args": { "External id": 19422,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651043174.927, "dur": 330.210, "args": { "External id": 19423,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2014, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651043187.140, "dur": 312.038, "args": { "External id": 19424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651043532.961, "dur": 2.078, "args": { "External id": 19425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2016, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043595.976, "dur": 7.000, "args": { "External id": 19426,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043649.322, "dur": 1.683, "args": { "External id": 19427,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043669.448, "dur": 1.014, "args": { "External id": 19428,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043684.152, "dur": 1.007, "args": { "External id": 19429,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043697.210, "dur": 0.848, "args": { "External id": 19430,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043709.829, "dur": 0.966, "args": { "External id": 19431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043721.975, "dur": 1.275, "args": { "External id": 19432,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043736.605, "dur": 1.981, "args": { "External id": 19433,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651043749.556, "dur": 0.775, "args": { "External id": 19434,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2025 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651043841.279, "dur": 2726.913, "args": { "External id": 19435,"Record function id": 0, "Ev Idx": 2026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651043859.662, "dur": 1044.087, "args": { "External id": 19436,"Record function id": 0, "Ev Idx": 2027 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651043875.493, "dur": 371.343, "args": { "External id": 19437,"Record function id": 0, "Ev Idx": 2028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043948.102, "dur": 4.363, "args": { "External id": 19438,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043955.774, "dur": 1.144, "args": { "External id": 19439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043958.803, "dur": 0.898, "args": { "External id": 19440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043961.226, "dur": 1.877, "args": { "External id": 19441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043964.577, "dur": 0.949, "args": { "External id": 19442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043967.260, "dur": 0.740, "args": { "External id": 19443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043969.891, "dur": 1.859, "args": { "External id": 19444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043973.211, "dur": 1.257, "args": { "External id": 19445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043975.873, "dur": 0.963, "args": { "External id": 19446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651043978.641, "dur": 0.857, "args": { "External id": 19447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2038 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651044036.711, "dur": 160.231, "args": { "External id": 19448,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651044053.503, "dur": 138.731, "args": { "External id": 19449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651044079.286, "dur": 12.822, "args": { "External id": 19450,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651044095.637, "dur": 69.351, "args": { "External id": 19451,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651044098.355, "dur": 66.250, "args": { "External id": 19452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044102.366, "dur": 8.310, "args": { "External id": 19453,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651044112.631, "dur": 51.531, "args": { "External id": 19454,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2045 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.23", "pid": 1336759, "tid": 1381173, "ts": 1295651044331.626, "dur": 563.485, "args": { "External id": 19455,"Record function id": 0, "Ev Idx": 2046 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651044351.470, "dur": 530.357, "args": { "External id": 19456,"Record function id": 0, "Ev Idx": 2047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651044429.883, "dur": 5.956, "args": { "External id": 19457,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651044452.649, "dur": 31.722, "args": { "External id": 19458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044458.413, "dur": 1.937, "args": { "External id": 19459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044463.118, "dur": 0.419, "args": { "External id": 19460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044465.511, "dur": 0.417, "args": { "External id": 19461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044467.978, "dur": 0.346, "args": { "External id": 19462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044469.735, "dur": 0.376, "args": { "External id": 19463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044471.976, "dur": 0.395, "args": { "External id": 19464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044474.355, "dur": 1.344, "args": { "External id": 19465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044477.247, "dur": 0.392, "args": { "External id": 19466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044479.111, "dur": 0.406, "args": { "External id": 19467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651044494.112, "dur": 34.790, "args": { "External id": 19468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2059 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651044560.379, "dur": 98.741, "args": { "External id": 19469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651044570.482, "dur": 3.271, "args": { "External id": 19470,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651044578.771, "dur": 10.689, "args": { "External id": 19471,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651044582.970, "dur": 6.048, "args": { "External id": 19472,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044587.063, "dur": 0.608, "args": { "External id": 19473,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651044596.638, "dur": 24.084, "args": { "External id": 19474,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044598.974, "dur": 0.355, "args": { "External id": 19475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044600.996, "dur": 0.414, "args": { "External id": 19476,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044603.169, "dur": 0.378, "args": { "External id": 19477,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044605.178, "dur": 1.238, "args": { "External id": 19478,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044608.006, "dur": 0.440, "args": { "External id": 19479,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044610.290, "dur": 0.398, "args": { "External id": 19480,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044612.652, "dur": 0.312, "args": { "External id": 19481,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044614.666, "dur": 0.381, "args": { "External id": 19482,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651044616.787, "dur": 0.355, "args": { "External id": 19483,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651044632.994, "dur": 18.533, "args": { "External id": 19484,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2075 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651044703.966, "dur": 110.496, "args": { "External id": 19485,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2076 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651044726.235, "dur": 84.859, "args": { "External id": 19486,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2077, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651044736.482, "dur": 70.510, "args": { "External id": 19487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2078 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651044828.879, "dur": 1.818, "args": { "External id": 19488,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2079, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651044911.384, "dur": 1637.003, "args": { "External id": 19489,"Sequence number": 246590, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2080 } }, { "ph": "f", "id": 178, "pid": 1336759, "tid": 1381173, "ts": 1295651044911.384, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045060.244, "dur": 106.194, "args": { "External id": 19490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2081 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651045207.237, "dur": 55.712, "args": { "External id": 19491,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651045282.065, "dur": 52.248, "args": { "External id": 19492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045344.016, "dur": 33.171, "args": { "External id": 19493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045385.639, "dur": 44.937, "args": { "External id": 19494,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045437.936, "dur": 27.852, "args": { "External id": 19495,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045473.014, "dur": 42.138, "args": { "External id": 19496,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651045537.796, "dur": 21.786, "args": { "External id": 19497,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2088 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651045579.870, "dur": 26.811, "args": { "External id": 19498,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2089 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651045625.617, "dur": 18.754, "args": { "External id": 19499,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2090 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651045657.665, "dur": 14.738, "args": { "External id": 19500,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045680.622, "dur": 27.869, "args": { "External id": 19501,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651045711.809, "dur": 32.127, "args": { "External id": 19502,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2093 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651045784.271, "dur": 169.484, "args": { "External id": 19503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651045864.063, "dur": 5.272, "args": { "External id": 19504,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651045871.433, "dur": 2.211, "args": { "External id": 19505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2096 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651046018.473, "dur": 28.842, "args": { "External id": 19506,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2097 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651046061.392, "dur": 14.374, "args": { "External id": 19507,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046086.249, "dur": 41.268, "args": { "External id": 19508,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046134.940, "dur": 35.318, "args": { "External id": 19509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046179.857, "dur": 21.516, "args": { "External id": 19510,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046207.481, "dur": 43.191, "args": { "External id": 19511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046260.268, "dur": 23.452, "args": { "External id": 19512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651046291.767, "dur": 40.657, "args": { "External id": 19513,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2104 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651046357.666, "dur": 26.120, "args": { "External id": 19514,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2105 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651046401.582, "dur": 23.300, "args": { "External id": 19515,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2106 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651046438.196, "dur": 17.390, "args": { "External id": 19516,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2107 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651046470.122, "dur": 18.616, "args": { "External id": 19517,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2108 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651046501.704, "dur": 15.199, "args": { "External id": 19518,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046591.278, "dur": 15.025, "args": { "External id": 19519,"Record function id": 0, "Ev Idx": 2110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046594.377, "dur": 10.971, "args": { "External id": 19520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046598.387, "dur": 5.930, "args": { "External id": 19521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046600.160, "dur": 3.997, "args": { "External id": 19522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046610.148, "dur": 5.273, "args": { "External id": 19523,"Record function id": 0, "Ev Idx": 2114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046611.801, "dur": 3.200, "args": { "External id": 19524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046612.668, "dur": 1.833, "args": { "External id": 19525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046613.385, "dur": 0.984, "args": { "External id": 19526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046618.885, "dur": 4.899, "args": { "External id": 19527,"Record function id": 0, "Ev Idx": 2118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046620.481, "dur": 2.900, "args": { "External id": 19528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046621.058, "dur": 1.898, "args": { "External id": 19529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046621.781, "dur": 1.084, "args": { "External id": 19530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046626.934, "dur": 5.367, "args": { "External id": 19531,"Record function id": 0, "Ev Idx": 2122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046628.648, "dur": 3.271, "args": { "External id": 19532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046629.286, "dur": 2.226, "args": { "External id": 19533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046629.773, "dur": 1.674, "args": { "External id": 19534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046635.428, "dur": 3.646, "args": { "External id": 19535,"Record function id": 0, "Ev Idx": 2126 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046636.625, "dur": 2.061, "args": { "External id": 19536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046637.112, "dur": 1.191, "args": { "External id": 19537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2128 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046637.390, "dur": 0.811, "args": { "External id": 19538,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2129 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046642.186, "dur": 3.496, "args": { "External id": 19539,"Record function id": 0, "Ev Idx": 2130 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046643.389, "dur": 1.891, "args": { "External id": 19540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046643.831, "dur": 1.061, "args": { "External id": 19541,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2132 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046644.225, "dur": 0.524, "args": { "External id": 19542,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2133 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046648.917, "dur": 3.950, "args": { "External id": 19543,"Record function id": 0, "Ev Idx": 2134 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046650.043, "dur": 2.430, "args": { "External id": 19544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046650.598, "dur": 1.419, "args": { "External id": 19545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2136 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046651.153, "dur": 0.750, "args": { "External id": 19546,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046655.889, "dur": 3.923, "args": { "External id": 19547,"Record function id": 0, "Ev Idx": 2138 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046657.106, "dur": 2.296, "args": { "External id": 19548,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046658.020, "dur": 0.988, "args": { "External id": 19549,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2140 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046658.410, "dur": 0.510, "args": { "External id": 19550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2141 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046662.757, "dur": 3.852, "args": { "External id": 19551,"Record function id": 0, "Ev Idx": 2142 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651046663.885, "dur": 2.335, "args": { "External id": 19552,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046664.543, "dur": 1.273, "args": { "External id": 19553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2144 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651046665.259, "dur": 0.434, "args": { "External id": 19554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2145 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651046670.200, "dur": 38352.511, "args": { "External id": 19555,"Record function id": 0, "Sequence number": 246589, "Fwd thread id": 1, "Ev Idx": 2146 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651046671.538, "dur": 38306.515, "args": { "External id": 19556,"Sequence number": 246589, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2147 } }, { "ph": "f", "id": 179, "pid": 1336759, "tid": 1381173, "ts": 1295651046671.538, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651046700.246, "dur": 37.071, "args": { "External id": 19557,"Record function id": 0, "Ev Idx": 2148 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651046745.511, "dur": 60.854, "args": { "External id": 19558,"Record function id": 0, "Ev Idx": 2149 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.24)", "pid": 1336759, "tid": 1381173, "ts": 1295651046812.249, "dur": 38157.926, "args": { "External id": 19559,"Record function id": 0, "Ev Idx": 2150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651046900.899, "dur": 6.174, "args": { "External id": 19560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651046916.492, "dur": 4.558, "args": { "External id": 19561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2152 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651046936.316, "dur": 37255.156, "args": { "External id": 19562,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651046949.516, "dur": 37232.225, "args": { "External id": 19563,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651047041.149, "dur": 15.629, "args": { "External id": 19564,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651047063.445, "dur": 37078.514, "args": { "External id": 19565,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651047066.229, "dur": 37074.879, "args": { "External id": 19566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651047070.482, "dur": 5.922, "args": { "External id": 19567,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651047078.484, "dur": 37059.023, "args": { "External id": 19568,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651084302.807, "dur": 10.336, "args": { "External id": 19569,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651084306.506, "dur": 6.107, "args": { "External id": 19570,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651084342.794, "dur": 330.479, "args": { "External id": 19571,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651084372.711, "dur": 295.362, "args": { "External id": 19572,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2163, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651084384.395, "dur": 276.774, "args": { "External id": 19573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651084692.732, "dur": 2.044, "args": { "External id": 19574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2165, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084754.597, "dur": 6.596, "args": { "External id": 19575,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084806.812, "dur": 1.458, "args": { "External id": 19576,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084825.285, "dur": 1.169, "args": { "External id": 19577,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084840.413, "dur": 1.428, "args": { "External id": 19578,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084855.481, "dur": 1.134, "args": { "External id": 19579,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084868.754, "dur": 1.020, "args": { "External id": 19580,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084881.410, "dur": 1.057, "args": { "External id": 19581,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084895.420, "dur": 1.893, "args": { "External id": 19582,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651084908.741, "dur": 0.947, "args": { "External id": 19583,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2174 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651085040.498, "dur": 2663.464, "args": { "External id": 19584,"Record function id": 0, "Ev Idx": 2175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651085061.257, "dur": 1010.902, "args": { "External id": 19585,"Record function id": 0, "Ev Idx": 2176 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651085078.267, "dur": 343.663, "args": { "External id": 19586,"Record function id": 0, "Ev Idx": 2177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085155.112, "dur": 4.543, "args": { "External id": 19587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085162.974, "dur": 1.087, "args": { "External id": 19588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085165.910, "dur": 1.138, "args": { "External id": 19589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085168.929, "dur": 1.658, "args": { "External id": 19590,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085171.904, "dur": 0.749, "args": { "External id": 19591,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085174.370, "dur": 0.984, "args": { "External id": 19592,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085176.896, "dur": 1.653, "args": { "External id": 19593,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085180.063, "dur": 0.678, "args": { "External id": 19594,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085182.163, "dur": 0.971, "args": { "External id": 19595,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651085184.774, "dur": 0.805, "args": { "External id": 19596,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2187 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651085204.439, "dur": 178.945, "args": { "External id": 19597,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651085219.727, "dur": 158.385, "args": { "External id": 19598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651085258.923, "dur": 12.815, "args": { "External id": 19599,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651085275.891, "dur": 71.588, "args": { "External id": 19600,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651085278.286, "dur": 68.870, "args": { "External id": 19601,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085282.908, "dur": 7.154, "args": { "External id": 19602,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651085291.989, "dur": 54.735, "args": { "External id": 19603,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2194 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.22", "pid": 1336759, "tid": 1381173, "ts": 1295651085499.431, "dur": 565.022, "args": { "External id": 19604,"Record function id": 0, "Ev Idx": 2195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651085516.681, "dur": 534.264, "args": { "External id": 19605,"Record function id": 0, "Ev Idx": 2196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651085570.483, "dur": 4.816, "args": { "External id": 19606,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651085590.764, "dur": 32.573, "args": { "External id": 19607,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085596.160, "dur": 1.562, "args": { "External id": 19608,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085600.279, "dur": 0.472, "args": { "External id": 19609,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085602.765, "dur": 0.451, "args": { "External id": 19610,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085604.993, "dur": 0.522, "args": { "External id": 19611,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085607.547, "dur": 0.391, "args": { "External id": 19612,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085609.509, "dur": 0.627, "args": { "External id": 19613,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085611.923, "dur": 1.284, "args": { "External id": 19614,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085615.052, "dur": 0.428, "args": { "External id": 19615,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085617.367, "dur": 0.278, "args": { "External id": 19616,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651085633.727, "dur": 27.669, "args": { "External id": 19617,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2208 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651085692.976, "dur": 97.096, "args": { "External id": 19618,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651085703.037, "dur": 2.922, "args": { "External id": 19619,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651085711.197, "dur": 11.093, "args": { "External id": 19620,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651085715.853, "dur": 5.996, "args": { "External id": 19621,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085720.009, "dur": 0.521, "args": { "External id": 19622,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651085729.252, "dur": 25.458, "args": { "External id": 19623,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085731.452, "dur": 0.396, "args": { "External id": 19624,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085734.186, "dur": 0.439, "args": { "External id": 19625,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085736.530, "dur": 0.356, "args": { "External id": 19626,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085738.358, "dur": 1.361, "args": { "External id": 19627,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085741.690, "dur": 0.407, "args": { "External id": 19628,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085743.883, "dur": 0.361, "args": { "External id": 19629,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085746.016, "dur": 0.401, "args": { "External id": 19630,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085748.157, "dur": 0.339, "args": { "External id": 19631,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651085750.225, "dur": 0.350, "args": { "External id": 19632,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651085764.088, "dur": 18.589, "args": { "External id": 19633,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2224 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651085834.747, "dur": 108.519, "args": { "External id": 19634,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2225 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651085856.973, "dur": 82.782, "args": { "External id": 19635,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2226, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651085866.998, "dur": 68.597, "args": { "External id": 19636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2227 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651085956.304, "dur": 1.762, "args": { "External id": 19637,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2228, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651086079.468, "dur": 1605.181, "args": { "External id": 19638,"Sequence number": 246588, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2229 } }, { "ph": "f", "id": 180, "pid": 1336759, "tid": 1381173, "ts": 1295651086079.468, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086185.766, "dur": 123.945, "args": { "External id": 19639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2230 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651086352.005, "dur": 36.811, "args": { "External id": 19640,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651086406.060, "dur": 49.668, "args": { "External id": 19641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086464.414, "dur": 32.655, "args": { "External id": 19642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086505.505, "dur": 44.232, "args": { "External id": 19643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086557.363, "dur": 27.748, "args": { "External id": 19644,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086593.060, "dur": 42.184, "args": { "External id": 19645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651086656.763, "dur": 20.662, "args": { "External id": 19646,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2237 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651086698.141, "dur": 26.131, "args": { "External id": 19647,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2238 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651086742.291, "dur": 18.390, "args": { "External id": 19648,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2239 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651086774.205, "dur": 14.534, "args": { "External id": 19649,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086797.257, "dur": 28.262, "args": { "External id": 19650,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651086829.017, "dur": 32.118, "args": { "External id": 19651,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2242 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651086887.767, "dur": 210.422, "args": { "External id": 19652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651086964.019, "dur": 6.043, "args": { "External id": 19653,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651086972.377, "dur": 2.151, "args": { "External id": 19654,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2245 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651087131.385, "dur": 24.517, "args": { "External id": 19655,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2246 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651087167.484, "dur": 14.439, "args": { "External id": 19656,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087190.919, "dur": 57.454, "args": { "External id": 19657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087258.064, "dur": 39.199, "args": { "External id": 19658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087329.901, "dur": 23.226, "args": { "External id": 19659,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087359.206, "dur": 29.994, "args": { "External id": 19660,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087396.345, "dur": 20.233, "args": { "External id": 19661,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651087435.525, "dur": 39.928, "args": { "External id": 19662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2253 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651087495.579, "dur": 22.868, "args": { "External id": 19663,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2254 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651087539.202, "dur": 23.241, "args": { "External id": 19664,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2255 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651087576.248, "dur": 20.337, "args": { "External id": 19665,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2256 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651087612.741, "dur": 15.242, "args": { "External id": 19666,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2257 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651087640.924, "dur": 15.118, "args": { "External id": 19667,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087726.959, "dur": 15.652, "args": { "External id": 19668,"Record function id": 0, "Ev Idx": 2259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087730.146, "dur": 11.421, "args": { "External id": 19669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087734.453, "dur": 6.268, "args": { "External id": 19670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087736.422, "dur": 4.140, "args": { "External id": 19671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087746.630, "dur": 5.154, "args": { "External id": 19672,"Record function id": 0, "Ev Idx": 2263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087747.956, "dur": 3.377, "args": { "External id": 19673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087748.652, "dur": 2.255, "args": { "External id": 19674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087749.625, "dur": 1.163, "args": { "External id": 19675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087755.066, "dur": 3.817, "args": { "External id": 19676,"Record function id": 0, "Ev Idx": 2267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087756.340, "dur": 2.151, "args": { "External id": 19677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087756.852, "dur": 1.248, "args": { "External id": 19678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087757.184, "dur": 0.811, "args": { "External id": 19679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087762.072, "dur": 4.761, "args": { "External id": 19680,"Record function id": 0, "Ev Idx": 2271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087763.342, "dur": 3.102, "args": { "External id": 19681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087764.080, "dur": 1.964, "args": { "External id": 19682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087764.427, "dur": 1.537, "args": { "External id": 19683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087770.051, "dur": 3.769, "args": { "External id": 19684,"Record function id": 0, "Ev Idx": 2275 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087771.440, "dur": 1.995, "args": { "External id": 19685,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087771.968, "dur": 1.091, "args": { "External id": 19686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2277 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087772.309, "dur": 0.657, "args": { "External id": 19687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2278 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087776.954, "dur": 3.489, "args": { "External id": 19688,"Record function id": 0, "Ev Idx": 2279 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087777.977, "dur": 2.065, "args": { "External id": 19689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087778.479, "dur": 1.193, "args": { "External id": 19690,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2281 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087779.017, "dur": 0.552, "args": { "External id": 19691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2282 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087783.780, "dur": 3.620, "args": { "External id": 19692,"Record function id": 0, "Ev Idx": 2283 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087785.241, "dur": 1.765, "args": { "External id": 19693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087785.724, "dur": 0.890, "args": { "External id": 19694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2285 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087786.016, "dur": 0.504, "args": { "External id": 19695,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2286 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087790.489, "dur": 3.254, "args": { "External id": 19696,"Record function id": 0, "Ev Idx": 2287 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087791.575, "dur": 1.767, "args": { "External id": 19697,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087792.055, "dur": 0.910, "args": { "External id": 19698,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2289 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087792.309, "dur": 0.591, "args": { "External id": 19699,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2290 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087796.773, "dur": 3.622, "args": { "External id": 19700,"Record function id": 0, "Ev Idx": 2291 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651087797.908, "dur": 2.101, "args": { "External id": 19701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087798.357, "dur": 1.285, "args": { "External id": 19702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2293 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651087798.853, "dur": 0.688, "args": { "External id": 19703,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2294 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651087804.099, "dur": 36922.597, "args": { "External id": 19704,"Record function id": 0, "Sequence number": 246587, "Fwd thread id": 1, "Ev Idx": 2295 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651087805.409, "dur": 36912.323, "args": { "External id": 19705,"Sequence number": 246587, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2296 } }, { "ph": "f", "id": 181, "pid": 1336759, "tid": 1381173, "ts": 1295651087805.409, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651087834.484, "dur": 35.065, "args": { "External id": 19706,"Record function id": 0, "Ev Idx": 2297 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651087877.693, "dur": 61.329, "args": { "External id": 19707,"Record function id": 0, "Ev Idx": 2298 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.23)", "pid": 1336759, "tid": 1381173, "ts": 1295651087945.261, "dur": 36763.815, "args": { "External id": 19708,"Record function id": 0, "Ev Idx": 2299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651088079.841, "dur": 7.662, "args": { "External id": 19709,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651088099.156, "dur": 5.028, "args": { "External id": 19710,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2301 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651088124.017, "dur": 35744.560, "args": { "External id": 19711,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651088137.428, "dur": 35719.421, "args": { "External id": 19712,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651088179.719, "dur": 15.640, "args": { "External id": 19713,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651088201.883, "dur": 35611.577, "args": { "External id": 19714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651088204.719, "dur": 35607.428, "args": { "External id": 19715,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651088209.114, "dur": 4.969, "args": { "External id": 19716,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651088216.053, "dur": 35591.952, "args": { "External id": 19717,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651123972.919, "dur": 37.147, "args": { "External id": 19718,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651123976.644, "dur": 32.624, "args": { "External id": 19719,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651124043.820, "dur": 367.970, "args": { "External id": 19720,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651124073.064, "dur": 333.269, "args": { "External id": 19721,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2312, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651124085.783, "dur": 314.576, "args": { "External id": 19722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651124433.805, "dur": 2.350, "args": { "External id": 19723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2314, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124499.492, "dur": 6.510, "args": { "External id": 19724,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124551.866, "dur": 1.320, "args": { "External id": 19725,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124569.950, "dur": 0.950, "args": { "External id": 19726,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124583.526, "dur": 1.000, "args": { "External id": 19727,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124596.065, "dur": 0.910, "args": { "External id": 19728,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124607.377, "dur": 0.884, "args": { "External id": 19729,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124618.410, "dur": 0.998, "args": { "External id": 19730,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124631.144, "dur": 2.375, "args": { "External id": 19731,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124643.538, "dur": 0.788, "args": { "External id": 19732,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2323 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651124742.091, "dur": 2741.316, "args": { "External id": 19733,"Record function id": 0, "Ev Idx": 2324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651124761.540, "dur": 1038.984, "args": { "External id": 19734,"Record function id": 0, "Ev Idx": 2325 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651124777.883, "dur": 361.399, "args": { "External id": 19735,"Record function id": 0, "Ev Idx": 2326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124852.660, "dur": 4.047, "args": { "External id": 19736,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124859.880, "dur": 1.022, "args": { "External id": 19737,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124862.611, "dur": 1.090, "args": { "External id": 19738,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124865.027, "dur": 1.621, "args": { "External id": 19739,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124868.265, "dur": 0.817, "args": { "External id": 19740,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124870.463, "dur": 0.772, "args": { "External id": 19741,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124872.659, "dur": 2.091, "args": { "External id": 19742,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124876.221, "dur": 0.910, "args": { "External id": 19743,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124878.576, "dur": 0.790, "args": { "External id": 19744,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651124880.545, "dur": 0.945, "args": { "External id": 19745,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2336 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651124899.478, "dur": 200.640, "args": { "External id": 19746,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651124914.881, "dur": 179.401, "args": { "External id": 19747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651124938.431, "dur": 11.983, "args": { "External id": 19748,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651124953.687, "dur": 110.525, "args": { "External id": 19749,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651124956.409, "dur": 107.298, "args": { "External id": 19750,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651124960.286, "dur": 7.775, "args": { "External id": 19751,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651124970.055, "dur": 92.534, "args": { "External id": 19752,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2343 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.21", "pid": 1336759, "tid": 1381173, "ts": 1295651125225.206, "dur": 567.101, "args": { "External id": 19753,"Record function id": 0, "Ev Idx": 2344 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651125263.712, "dur": 515.090, "args": { "External id": 19754,"Record function id": 0, "Ev Idx": 2345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651125325.685, "dur": 6.306, "args": { "External id": 19755,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651125350.566, "dur": 29.665, "args": { "External id": 19756,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125355.509, "dur": 1.642, "args": { "External id": 19757,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125359.286, "dur": 0.442, "args": { "External id": 19758,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125361.214, "dur": 0.645, "args": { "External id": 19759,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125363.365, "dur": 0.453, "args": { "External id": 19760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125365.489, "dur": 0.487, "args": { "External id": 19761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125367.196, "dur": 0.398, "args": { "External id": 19762,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125369.356, "dur": 1.560, "args": { "External id": 19763,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125372.438, "dur": 0.455, "args": { "External id": 19764,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125374.590, "dur": 0.350, "args": { "External id": 19765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651125393.793, "dur": 34.467, "args": { "External id": 19766,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2357 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651125459.837, "dur": 99.337, "args": { "External id": 19767,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651125470.893, "dur": 3.364, "args": { "External id": 19768,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651125479.359, "dur": 10.745, "args": { "External id": 19769,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651125483.942, "dur": 5.742, "args": { "External id": 19770,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125487.743, "dur": 0.569, "args": { "External id": 19771,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651125497.454, "dur": 23.394, "args": { "External id": 19772,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125499.957, "dur": 0.555, "args": { "External id": 19773,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125502.049, "dur": 0.530, "args": { "External id": 19774,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125503.919, "dur": 0.444, "args": { "External id": 19775,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125505.760, "dur": 1.450, "args": { "External id": 19776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125508.682, "dur": 0.389, "args": { "External id": 19777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125510.481, "dur": 0.581, "args": { "External id": 19778,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125512.582, "dur": 0.339, "args": { "External id": 19779,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125514.686, "dur": 0.407, "args": { "External id": 19780,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651125516.457, "dur": 0.500, "args": { "External id": 19781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651125532.144, "dur": 19.224, "args": { "External id": 19782,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2373 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651125604.885, "dur": 107.995, "args": { "External id": 19783,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2374 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651125626.337, "dur": 82.785, "args": { "External id": 19784,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2375, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651125636.498, "dur": 68.897, "args": { "External id": 19785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2376 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651125727.346, "dur": 1.757, "args": { "External id": 19786,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2377, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651125807.041, "dur": 1656.946, "args": { "External id": 19787,"Sequence number": 246586, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2378 } }, { "ph": "f", "id": 182, "pid": 1336759, "tid": 1381173, "ts": 1295651125807.041, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651125909.162, "dur": 148.198, "args": { "External id": 19788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2379 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651126100.950, "dur": 40.110, "args": { "External id": 19789,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651126158.823, "dur": 57.265, "args": { "External id": 19790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126226.843, "dur": 54.105, "args": { "External id": 19791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126291.558, "dur": 45.997, "args": { "External id": 19792,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126345.584, "dur": 27.734, "args": { "External id": 19793,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126381.481, "dur": 42.204, "args": { "External id": 19794,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651126448.043, "dur": 23.447, "args": { "External id": 19795,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2386 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651126499.581, "dur": 27.833, "args": { "External id": 19796,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2387 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651126547.374, "dur": 18.953, "args": { "External id": 19797,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2388 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651126581.585, "dur": 14.684, "args": { "External id": 19798,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126605.355, "dur": 28.761, "args": { "External id": 19799,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126637.631, "dur": 32.633, "args": { "External id": 19800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2391 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651126697.842, "dur": 166.043, "args": { "External id": 19801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651126774.719, "dur": 5.839, "args": { "External id": 19802,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651126782.813, "dur": 2.371, "args": { "External id": 19803,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2394 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651126894.546, "dur": 24.059, "args": { "External id": 19804,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2395 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651126929.772, "dur": 13.585, "args": { "External id": 19805,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651126951.276, "dur": 71.308, "args": { "External id": 19806,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651127033.135, "dur": 39.313, "args": { "External id": 19807,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651127081.502, "dur": 22.090, "args": { "External id": 19808,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651127110.012, "dur": 29.864, "args": { "External id": 19809,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651127146.229, "dur": 21.258, "args": { "External id": 19810,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651127175.855, "dur": 39.592, "args": { "External id": 19811,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651127257.231, "dur": 30.953, "args": { "External id": 19812,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2403 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651127305.290, "dur": 22.715, "args": { "External id": 19813,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651127345.244, "dur": 16.162, "args": { "External id": 19814,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2405 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651127375.977, "dur": 17.802, "args": { "External id": 19815,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2406 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651127413.776, "dur": 16.742, "args": { "External id": 19816,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127506.249, "dur": 16.071, "args": { "External id": 19817,"Record function id": 0, "Ev Idx": 2408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127509.665, "dur": 11.513, "args": { "External id": 19818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127513.852, "dur": 6.337, "args": { "External id": 19819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127515.799, "dur": 4.266, "args": { "External id": 19820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127526.043, "dur": 5.344, "args": { "External id": 19821,"Record function id": 0, "Ev Idx": 2412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127527.259, "dur": 3.646, "args": { "External id": 19822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127528.050, "dur": 2.332, "args": { "External id": 19823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127528.780, "dur": 1.485, "args": { "External id": 19824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127534.478, "dur": 4.120, "args": { "External id": 19825,"Record function id": 0, "Ev Idx": 2416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127535.719, "dur": 2.478, "args": { "External id": 19826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127536.336, "dur": 1.457, "args": { "External id": 19827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127536.775, "dur": 0.947, "args": { "External id": 19828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127541.632, "dur": 3.871, "args": { "External id": 19829,"Record function id": 0, "Ev Idx": 2420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127542.847, "dur": 2.256, "args": { "External id": 19830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127543.416, "dur": 1.296, "args": { "External id": 19831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127543.815, "dur": 0.836, "args": { "External id": 19832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127548.533, "dur": 3.733, "args": { "External id": 19833,"Record function id": 0, "Ev Idx": 2424 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127549.464, "dur": 2.407, "args": { "External id": 19834,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127549.975, "dur": 1.493, "args": { "External id": 19835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2426 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127550.504, "dur": 0.873, "args": { "External id": 19836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2427 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127555.344, "dur": 3.943, "args": { "External id": 19837,"Record function id": 0, "Ev Idx": 2428 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127556.487, "dur": 2.392, "args": { "External id": 19838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127556.937, "dur": 1.529, "args": { "External id": 19839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2430 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127557.377, "dur": 0.985, "args": { "External id": 19840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2431 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127562.482, "dur": 3.671, "args": { "External id": 19841,"Record function id": 0, "Ev Idx": 2432 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127563.460, "dur": 2.291, "args": { "External id": 19842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127564.119, "dur": 1.229, "args": { "External id": 19843,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2434 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127564.564, "dur": 0.723, "args": { "External id": 19844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2435 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127569.181, "dur": 4.006, "args": { "External id": 19845,"Record function id": 0, "Ev Idx": 2436 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127570.572, "dur": 2.193, "args": { "External id": 19846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127571.026, "dur": 1.335, "args": { "External id": 19847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2438 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127571.533, "dur": 0.746, "args": { "External id": 19848,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2439 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127576.174, "dur": 3.487, "args": { "External id": 19849,"Record function id": 0, "Ev Idx": 2440 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651127577.162, "dur": 2.096, "args": { "External id": 19850,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127577.585, "dur": 1.270, "args": { "External id": 19851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2442 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651127578.004, "dur": 0.773, "args": { "External id": 19852,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2443 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651127583.564, "dur": 35993.945, "args": { "External id": 19853,"Record function id": 0, "Sequence number": 246585, "Fwd thread id": 1, "Ev Idx": 2444 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651127585.030, "dur": 35984.319, "args": { "External id": 19854,"Sequence number": 246585, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2445 } }, { "ph": "f", "id": 183, "pid": 1336759, "tid": 1381173, "ts": 1295651127585.030, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651127615.271, "dur": 39.699, "args": { "External id": 19855,"Record function id": 0, "Ev Idx": 2446 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651127662.636, "dur": 58.415, "args": { "External id": 19856,"Record function id": 0, "Ev Idx": 2447 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.22)", "pid": 1336759, "tid": 1381173, "ts": 1295651127727.448, "dur": 35834.112, "args": { "External id": 19857,"Record function id": 0, "Ev Idx": 2448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651127815.255, "dur": 6.754, "args": { "External id": 19858,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651127831.166, "dur": 4.725, "args": { "External id": 19859,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2450 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651127850.259, "dur": 34886.194, "args": { "External id": 19860,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651127863.437, "dur": 34863.574, "args": { "External id": 19861,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651127916.039, "dur": 13.770, "args": { "External id": 19862,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651127936.578, "dur": 34751.196, "args": { "External id": 19863,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651127939.385, "dur": 34747.698, "args": { "External id": 19864,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651127943.339, "dur": 5.080, "args": { "External id": 19865,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651127950.265, "dur": 34733.338, "args": { "External id": 19866,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651162828.504, "dur": 9.569, "args": { "External id": 19867,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651162831.799, "dur": 5.926, "args": { "External id": 19868,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651162868.419, "dur": 396.049, "args": { "External id": 19869,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651162896.164, "dur": 362.044, "args": { "External id": 19870,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2461, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651162907.877, "dur": 344.337, "args": { "External id": 19871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651163285.381, "dur": 2.721, "args": { "External id": 19872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2463, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163350.203, "dur": 6.973, "args": { "External id": 19873,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163404.679, "dur": 1.560, "args": { "External id": 19874,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163423.247, "dur": 1.135, "args": { "External id": 19875,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163436.847, "dur": 0.998, "args": { "External id": 19876,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163450.315, "dur": 1.197, "args": { "External id": 19877,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163462.442, "dur": 1.054, "args": { "External id": 19878,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163474.132, "dur": 1.080, "args": { "External id": 19879,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163487.157, "dur": 2.310, "args": { "External id": 19880,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163499.915, "dur": 0.967, "args": { "External id": 19881,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651163592.173, "dur": 2745.872, "args": { "External id": 19882,"Record function id": 0, "Ev Idx": 2473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651163611.373, "dur": 1018.105, "args": { "External id": 19883,"Record function id": 0, "Ev Idx": 2474 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651163626.808, "dur": 310.002, "args": { "External id": 19884,"Record function id": 0, "Ev Idx": 2475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163699.059, "dur": 4.442, "args": { "External id": 19885,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163706.521, "dur": 1.197, "args": { "External id": 19886,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163709.954, "dur": 0.946, "args": { "External id": 19887,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163712.462, "dur": 1.313, "args": { "External id": 19888,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163715.223, "dur": 1.120, "args": { "External id": 19889,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163719.382, "dur": 1.056, "args": { "External id": 19890,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163721.962, "dur": 1.846, "args": { "External id": 19891,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163725.131, "dur": 0.961, "args": { "External id": 19892,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163727.426, "dur": 0.868, "args": { "External id": 19893,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651163731.294, "dur": 0.733, "args": { "External id": 19894,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2485 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651163749.856, "dur": 155.563, "args": { "External id": 19895,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651163774.026, "dur": 126.968, "args": { "External id": 19896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651163791.803, "dur": 12.027, "args": { "External id": 19897,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651163806.861, "dur": 68.180, "args": { "External id": 19898,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651163809.165, "dur": 65.600, "args": { "External id": 19899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651163812.951, "dur": 7.328, "args": { "External id": 19900,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651163821.699, "dur": 52.477, "args": { "External id": 19901,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2492 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.20", "pid": 1336759, "tid": 1381173, "ts": 1295651164060.258, "dur": 560.936, "args": { "External id": 19902,"Record function id": 0, "Ev Idx": 2493 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651164079.044, "dur": 529.955, "args": { "External id": 19903,"Record function id": 0, "Ev Idx": 2494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651164136.457, "dur": 5.560, "args": { "External id": 19904,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651164158.216, "dur": 33.714, "args": { "External id": 19905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164163.355, "dur": 1.942, "args": { "External id": 19906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164167.706, "dur": 0.540, "args": { "External id": 19907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164169.961, "dur": 4.037, "args": { "External id": 19908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164175.655, "dur": 0.618, "args": { "External id": 19909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164178.210, "dur": 0.468, "args": { "External id": 19910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164180.198, "dur": 0.444, "args": { "External id": 19911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164182.391, "dur": 0.514, "args": { "External id": 19912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164184.178, "dur": 0.598, "args": { "External id": 19913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164186.426, "dur": 0.364, "args": { "External id": 19914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651164201.075, "dur": 49.359, "args": { "External id": 19915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2506 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651164285.451, "dur": 101.744, "args": { "External id": 19916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651164295.739, "dur": 4.659, "args": { "External id": 19917,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651164305.113, "dur": 11.524, "args": { "External id": 19918,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651164309.373, "dur": 6.850, "args": { "External id": 19919,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164313.532, "dur": 1.146, "args": { "External id": 19920,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651164323.864, "dur": 25.043, "args": { "External id": 19921,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164326.302, "dur": 0.665, "args": { "External id": 19922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164328.746, "dur": 0.503, "args": { "External id": 19923,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164330.662, "dur": 0.642, "args": { "External id": 19924,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164332.922, "dur": 0.681, "args": { "External id": 19925,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164335.013, "dur": 0.518, "args": { "External id": 19926,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164337.148, "dur": 0.776, "args": { "External id": 19927,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164339.390, "dur": 0.951, "args": { "External id": 19928,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164341.900, "dur": 0.516, "args": { "External id": 19929,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651164343.873, "dur": 0.530, "args": { "External id": 19930,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651164358.209, "dur": 21.039, "args": { "External id": 19931,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2522 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651164431.797, "dur": 113.503, "args": { "External id": 19932,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2523 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651164453.743, "dur": 87.977, "args": { "External id": 19933,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2524, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651164463.867, "dur": 73.819, "args": { "External id": 19934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2525 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651164559.370, "dur": 1.848, "args": { "External id": 19935,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2526, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651164636.793, "dur": 1681.136, "args": { "External id": 19936,"Sequence number": 246584, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2527 } }, { "ph": "f", "id": 184, "pid": 1336759, "tid": 1381173, "ts": 1295651164636.793, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651164742.890, "dur": 105.365, "args": { "External id": 19937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2528 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651164887.709, "dur": 37.414, "args": { "External id": 19938,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651164941.504, "dur": 91.654, "args": { "External id": 19939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165047.865, "dur": 37.429, "args": { "External id": 19940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165092.434, "dur": 45.877, "args": { "External id": 19941,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165145.590, "dur": 28.274, "args": { "External id": 19942,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165181.402, "dur": 41.438, "args": { "External id": 19943,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651165265.662, "dur": 24.496, "args": { "External id": 19944,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2535 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651165310.413, "dur": 26.420, "args": { "External id": 19945,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2536 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651165358.985, "dur": 18.487, "args": { "External id": 19946,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2537 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651165394.763, "dur": 14.218, "args": { "External id": 19947,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165418.903, "dur": 32.488, "args": { "External id": 19948,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165455.331, "dur": 32.757, "args": { "External id": 19949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2540 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651165518.460, "dur": 169.716, "args": { "External id": 19950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651165597.259, "dur": 6.212, "args": { "External id": 19951,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651165605.672, "dur": 2.602, "args": { "External id": 19952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2543 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651165729.852, "dur": 24.195, "args": { "External id": 19953,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2544 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651165767.155, "dur": 14.394, "args": { "External id": 19954,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165790.960, "dur": 37.131, "args": { "External id": 19955,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165835.546, "dur": 38.141, "args": { "External id": 19956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165882.000, "dur": 21.613, "args": { "External id": 19957,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165909.630, "dur": 32.573, "args": { "External id": 19958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165949.884, "dur": 20.575, "args": { "External id": 19959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651165978.310, "dur": 74.328, "args": { "External id": 19960,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2551 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651166079.773, "dur": 36.949, "args": { "External id": 19961,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2552 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651166144.894, "dur": 23.257, "args": { "External id": 19962,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2553 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651166182.594, "dur": 20.144, "args": { "External id": 19963,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2554 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651166218.734, "dur": 34.176, "args": { "External id": 19964,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2555 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651166270.377, "dur": 16.758, "args": { "External id": 19965,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166360.731, "dur": 40.114, "args": { "External id": 19966,"Record function id": 0, "Ev Idx": 2557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166364.181, "dur": 35.494, "args": { "External id": 19967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166368.498, "dur": 30.158, "args": { "External id": 19968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166393.818, "dur": 4.682, "args": { "External id": 19969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166405.024, "dur": 5.720, "args": { "External id": 19970,"Record function id": 0, "Ev Idx": 2561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166406.325, "dur": 3.963, "args": { "External id": 19971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166407.057, "dur": 2.663, "args": { "External id": 19972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166408.004, "dur": 1.628, "args": { "External id": 19973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166413.971, "dur": 4.489, "args": { "External id": 19974,"Record function id": 0, "Ev Idx": 2565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166415.277, "dur": 2.765, "args": { "External id": 19975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166415.805, "dur": 1.703, "args": { "External id": 19976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166416.125, "dur": 1.304, "args": { "External id": 19977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166421.593, "dur": 3.869, "args": { "External id": 19978,"Record function id": 0, "Ev Idx": 2569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166422.575, "dur": 2.485, "args": { "External id": 19979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166423.140, "dur": 1.501, "args": { "External id": 19980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166423.427, "dur": 1.131, "args": { "External id": 19981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166428.462, "dur": 3.799, "args": { "External id": 19982,"Record function id": 0, "Ev Idx": 2573 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166429.544, "dur": 2.304, "args": { "External id": 19983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166430.035, "dur": 1.361, "args": { "External id": 19984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2575 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166430.329, "dur": 1.000, "args": { "External id": 19985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166435.304, "dur": 3.856, "args": { "External id": 19986,"Record function id": 0, "Ev Idx": 2577 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166436.467, "dur": 2.301, "args": { "External id": 19987,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166436.965, "dur": 1.378, "args": { "External id": 19988,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2579 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166437.382, "dur": 0.885, "args": { "External id": 19989,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2580 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166442.429, "dur": 3.995, "args": { "External id": 19990,"Record function id": 0, "Ev Idx": 2581 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166443.785, "dur": 2.219, "args": { "External id": 19991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166444.233, "dur": 1.344, "args": { "External id": 19992,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2583 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166444.502, "dur": 0.993, "args": { "External id": 19993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2584 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166449.811, "dur": 5.573, "args": { "External id": 19994,"Record function id": 0, "Ev Idx": 2585 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166450.762, "dur": 4.221, "args": { "External id": 19995,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166451.239, "dur": 3.331, "args": { "External id": 19996,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2587 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166453.648, "dur": 0.814, "args": { "External id": 19997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2588 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166458.610, "dur": 3.293, "args": { "External id": 19998,"Record function id": 0, "Ev Idx": 2589 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651166459.559, "dur": 1.936, "args": { "External id": 19999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166460.049, "dur": 1.025, "args": { "External id": 20000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2591 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651166460.317, "dur": 0.675, "args": { "External id": 20001,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651166465.644, "dur": 38016.590, "args": { "External id": 20002,"Record function id": 0, "Sequence number": 246583, "Fwd thread id": 1, "Ev Idx": 2593 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651166467.050, "dur": 38006.189, "args": { "External id": 20003,"Sequence number": 246583, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2594 } }, { "ph": "f", "id": 185, "pid": 1336759, "tid": 1381173, "ts": 1295651166467.050, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651166502.229, "dur": 40.826, "args": { "External id": 20004,"Record function id": 0, "Ev Idx": 2595 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651166550.571, "dur": 59.539, "args": { "External id": 20005,"Record function id": 0, "Ev Idx": 2596 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.21)", "pid": 1336759, "tid": 1381173, "ts": 1295651166616.472, "dur": 37849.048, "args": { "External id": 20006,"Record function id": 0, "Ev Idx": 2597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651166705.424, "dur": 6.666, "args": { "External id": 20007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651166721.624, "dur": 4.833, "args": { "External id": 20008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2599 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651166744.999, "dur": 36722.168, "args": { "External id": 20009,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651166761.192, "dur": 36696.274, "args": { "External id": 20010,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651166814.175, "dur": 14.512, "args": { "External id": 20011,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651166835.336, "dur": 36583.818, "args": { "External id": 20012,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651166837.981, "dur": 36580.464, "args": { "External id": 20013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651166841.755, "dur": 4.953, "args": { "External id": 20014,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651166848.681, "dur": 36566.287, "args": { "External id": 20015,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651203559.833, "dur": 9.448, "args": { "External id": 20016,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651203562.906, "dur": 6.025, "args": { "External id": 20017,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651203599.179, "dur": 551.863, "args": { "External id": 20018,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651203625.806, "dur": 515.765, "args": { "External id": 20019,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2610, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651203637.597, "dur": 496.786, "args": { "External id": 20020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651204174.857, "dur": 2.035, "args": { "External id": 20021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2612, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204262.822, "dur": 7.503, "args": { "External id": 20022,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204316.361, "dur": 1.736, "args": { "External id": 20023,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204333.647, "dur": 0.977, "args": { "External id": 20024,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204345.065, "dur": 1.166, "args": { "External id": 20025,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204355.670, "dur": 1.128, "args": { "External id": 20026,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204367.717, "dur": 1.470, "args": { "External id": 20027,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204378.975, "dur": 1.282, "args": { "External id": 20028,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204391.255, "dur": 2.210, "args": { "External id": 20029,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204402.585, "dur": 1.217, "args": { "External id": 20030,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2621 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651204498.497, "dur": 2713.540, "args": { "External id": 20031,"Record function id": 0, "Ev Idx": 2622 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651204517.535, "dur": 1015.120, "args": { "External id": 20032,"Record function id": 0, "Ev Idx": 2623 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651204533.338, "dur": 310.862, "args": { "External id": 20033,"Record function id": 0, "Ev Idx": 2624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204607.270, "dur": 4.312, "args": { "External id": 20034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204614.557, "dur": 1.012, "args": { "External id": 20035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204617.474, "dur": 1.713, "args": { "External id": 20036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204620.777, "dur": 1.172, "args": { "External id": 20037,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204623.211, "dur": 1.156, "args": { "External id": 20038,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204626.013, "dur": 0.940, "args": { "External id": 20039,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204628.479, "dur": 1.984, "args": { "External id": 20040,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204631.844, "dur": 1.002, "args": { "External id": 20041,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204634.072, "dur": 1.580, "args": { "External id": 20042,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651204636.977, "dur": 1.674, "args": { "External id": 20043,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2634 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651204658.509, "dur": 150.448, "args": { "External id": 20044,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651204673.903, "dur": 130.570, "args": { "External id": 20045,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651204695.498, "dur": 12.584, "args": { "External id": 20046,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651204711.594, "dur": 66.517, "args": { "External id": 20047,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651204714.292, "dur": 63.377, "args": { "External id": 20048,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651204718.538, "dur": 6.360, "args": { "External id": 20049,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651204727.010, "dur": 49.966, "args": { "External id": 20050,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2641 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.19", "pid": 1336759, "tid": 1381173, "ts": 1295651204918.503, "dur": 605.099, "args": { "External id": 20051,"Record function id": 0, "Ev Idx": 2642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651204934.208, "dur": 576.628, "args": { "External id": 20052,"Record function id": 0, "Ev Idx": 2643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651205030.136, "dur": 6.782, "args": { "External id": 20053,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651205053.657, "dur": 31.086, "args": { "External id": 20054,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205059.124, "dur": 1.749, "args": { "External id": 20055,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205063.041, "dur": 0.729, "args": { "External id": 20056,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205065.109, "dur": 0.868, "args": { "External id": 20057,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205067.362, "dur": 0.698, "args": { "External id": 20058,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205069.725, "dur": 0.689, "args": { "External id": 20059,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205071.863, "dur": 0.752, "args": { "External id": 20060,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205074.274, "dur": 0.796, "args": { "External id": 20061,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205076.567, "dur": 0.549, "args": { "External id": 20062,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205078.804, "dur": 0.892, "args": { "External id": 20063,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651205095.084, "dur": 33.361, "args": { "External id": 20064,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2655 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651205163.725, "dur": 121.701, "args": { "External id": 20065,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651205173.106, "dur": 3.935, "args": { "External id": 20066,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651205181.868, "dur": 10.719, "args": { "External id": 20067,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651205186.252, "dur": 5.903, "args": { "External id": 20068,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205190.183, "dur": 0.838, "args": { "External id": 20069,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651205199.218, "dur": 26.452, "args": { "External id": 20070,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205201.911, "dur": 0.835, "args": { "External id": 20071,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205204.539, "dur": 0.607, "args": { "External id": 20072,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205207.009, "dur": 0.618, "args": { "External id": 20073,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205209.143, "dur": 0.716, "args": { "External id": 20074,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205211.198, "dur": 1.049, "args": { "External id": 20075,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205213.572, "dur": 0.617, "args": { "External id": 20076,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205215.968, "dur": 0.788, "args": { "External id": 20077,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205218.147, "dur": 0.809, "args": { "External id": 20078,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651205220.338, "dur": 1.004, "args": { "External id": 20079,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651205255.543, "dur": 21.454, "args": { "External id": 20080,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2671 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651205333.366, "dur": 110.197, "args": { "External id": 20081,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2672 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651205354.702, "dur": 85.513, "args": { "External id": 20082,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2673, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651205364.923, "dur": 70.390, "args": { "External id": 20083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2674 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651205457.394, "dur": 1.870, "args": { "External id": 20084,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2675, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651205539.914, "dur": 1649.858, "args": { "External id": 20085,"Sequence number": 246582, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2676 } }, { "ph": "f", "id": 186, "pid": 1336759, "tid": 1381173, "ts": 1295651205539.914, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651205645.432, "dur": 102.211, "args": { "External id": 20086,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2677 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651205789.383, "dur": 40.177, "args": { "External id": 20087,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651205848.640, "dur": 48.852, "args": { "External id": 20088,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651205907.573, "dur": 32.266, "args": { "External id": 20089,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651205948.213, "dur": 89.911, "args": { "External id": 20090,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206051.466, "dur": 32.741, "args": { "External id": 20091,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206093.512, "dur": 42.742, "args": { "External id": 20092,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2683 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651206162.759, "dur": 21.721, "args": { "External id": 20093,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2684 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651206206.715, "dur": 46.933, "args": { "External id": 20094,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2685 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651206277.859, "dur": 20.382, "args": { "External id": 20095,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2686 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651206313.001, "dur": 14.271, "args": { "External id": 20096,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206338.589, "dur": 33.100, "args": { "External id": 20097,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206375.280, "dur": 33.003, "args": { "External id": 20098,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2689 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651206437.748, "dur": 181.338, "args": { "External id": 20099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651206518.358, "dur": 6.863, "args": { "External id": 20100,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651206527.256, "dur": 2.772, "args": { "External id": 20101,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2692 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651206648.687, "dur": 26.881, "args": { "External id": 20102,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2693 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651206687.127, "dur": 13.482, "args": { "External id": 20103,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206709.876, "dur": 33.796, "args": { "External id": 20104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206751.873, "dur": 33.396, "args": { "External id": 20105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206794.080, "dur": 21.617, "args": { "External id": 20106,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206821.888, "dur": 29.335, "args": { "External id": 20107,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206858.584, "dur": 23.948, "args": { "External id": 20108,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651206889.684, "dur": 29.346, "args": { "External id": 20109,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2700 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651206939.865, "dur": 35.077, "args": { "External id": 20110,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2701 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651207035.249, "dur": 26.532, "args": { "External id": 20111,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2702 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651207076.787, "dur": 16.812, "args": { "External id": 20112,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2703 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651207110.233, "dur": 15.694, "args": { "External id": 20113,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2704 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651207139.534, "dur": 19.394, "args": { "External id": 20114,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2705 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207250.131, "dur": 20.912, "args": { "External id": 20115,"Record function id": 0, "Ev Idx": 2706 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207254.225, "dur": 15.474, "args": { "External id": 20116,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207261.544, "dur": 6.808, "args": { "External id": 20117,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2708 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207263.288, "dur": 4.797, "args": { "External id": 20118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2709 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207276.076, "dur": 4.742, "args": { "External id": 20119,"Record function id": 0, "Ev Idx": 2710 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207277.238, "dur": 3.122, "args": { "External id": 20120,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207277.899, "dur": 2.066, "args": { "External id": 20121,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2712 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207278.532, "dur": 1.322, "args": { "External id": 20122,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2713 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207284.280, "dur": 5.035, "args": { "External id": 20123,"Record function id": 0, "Ev Idx": 2714 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207286.333, "dur": 2.530, "args": { "External id": 20124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207286.905, "dur": 1.558, "args": { "External id": 20125,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2716 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207287.362, "dur": 1.024, "args": { "External id": 20126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207292.755, "dur": 4.033, "args": { "External id": 20127,"Record function id": 0, "Ev Idx": 2718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207293.756, "dur": 2.578, "args": { "External id": 20128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207294.387, "dur": 1.529, "args": { "External id": 20129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207295.028, "dur": 0.786, "args": { "External id": 20130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207300.065, "dur": 4.098, "args": { "External id": 20131,"Record function id": 0, "Ev Idx": 2722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207301.068, "dur": 2.666, "args": { "External id": 20132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207301.586, "dur": 1.728, "args": { "External id": 20133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207301.992, "dur": 1.135, "args": { "External id": 20134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2725 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207307.288, "dur": 3.497, "args": { "External id": 20135,"Record function id": 0, "Ev Idx": 2726 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207308.292, "dur": 2.095, "args": { "External id": 20136,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207308.849, "dur": 1.092, "args": { "External id": 20137,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2728 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207309.102, "dur": 0.743, "args": { "External id": 20138,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2729 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207314.032, "dur": 7.155, "args": { "External id": 20139,"Record function id": 0, "Ev Idx": 2730 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207315.070, "dur": 5.721, "args": { "External id": 20140,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207315.531, "dur": 4.836, "args": { "External id": 20141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2732 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207319.287, "dur": 0.982, "args": { "External id": 20142,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2733 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207324.333, "dur": 3.714, "args": { "External id": 20143,"Record function id": 0, "Ev Idx": 2734 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207325.324, "dur": 2.336, "args": { "External id": 20144,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207325.967, "dur": 1.300, "args": { "External id": 20145,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2736 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207326.314, "dur": 0.877, "args": { "External id": 20146,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2737 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207331.153, "dur": 3.753, "args": { "External id": 20147,"Record function id": 0, "Ev Idx": 2738 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651207332.214, "dur": 2.281, "args": { "External id": 20148,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207332.709, "dur": 1.392, "args": { "External id": 20149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2740 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651207333.266, "dur": 0.746, "args": { "External id": 20150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2741 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651207338.522, "dur": 35070.110, "args": { "External id": 20151,"Record function id": 0, "Sequence number": 246581, "Fwd thread id": 1, "Ev Idx": 2742 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651207339.793, "dur": 35060.516, "args": { "External id": 20152,"Sequence number": 246581, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2743 } }, { "ph": "f", "id": 187, "pid": 1336759, "tid": 1381173, "ts": 1295651207339.793, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651207369.749, "dur": 38.499, "args": { "External id": 20153,"Record function id": 0, "Ev Idx": 2744 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651207415.702, "dur": 62.892, "args": { "External id": 20154,"Record function id": 0, "Ev Idx": 2745 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.20)", "pid": 1336759, "tid": 1381173, "ts": 1295651207485.342, "dur": 34906.771, "args": { "External id": 20155,"Record function id": 0, "Ev Idx": 2746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651207570.217, "dur": 6.532, "args": { "External id": 20156,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651207586.432, "dur": 5.010, "args": { "External id": 20157,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2748 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651207606.874, "dur": 33964.833, "args": { "External id": 20158,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651207619.850, "dur": 33941.962, "args": { "External id": 20159,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651207696.743, "dur": 14.197, "args": { "External id": 20160,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651207717.671, "dur": 33805.434, "args": { "External id": 20161,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651207720.410, "dur": 33801.896, "args": { "External id": 20162,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651207724.164, "dur": 5.510, "args": { "External id": 20163,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651207731.903, "dur": 33786.271, "args": { "External id": 20164,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651241665.298, "dur": 10.063, "args": { "External id": 20165,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651241668.616, "dur": 6.438, "args": { "External id": 20166,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651241710.315, "dur": 383.660, "args": { "External id": 20167,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651241739.542, "dur": 348.888, "args": { "External id": 20168,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2759, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651241751.083, "dur": 330.003, "args": { "External id": 20169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651242115.328, "dur": 2.209, "args": { "External id": 20170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2761, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242178.019, "dur": 6.856, "args": { "External id": 20171,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242227.503, "dur": 17.389, "args": { "External id": 20172,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242265.789, "dur": 0.960, "args": { "External id": 20173,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242277.206, "dur": 0.779, "args": { "External id": 20174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242287.298, "dur": 0.800, "args": { "External id": 20175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242298.281, "dur": 0.769, "args": { "External id": 20176,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242308.491, "dur": 1.143, "args": { "External id": 20177,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242318.956, "dur": 1.951, "args": { "External id": 20178,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242329.788, "dur": 0.841, "args": { "External id": 20179,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2770 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651242424.622, "dur": 2633.697, "args": { "External id": 20180,"Record function id": 0, "Ev Idx": 2771 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651242442.709, "dur": 991.101, "args": { "External id": 20181,"Record function id": 0, "Ev Idx": 2772 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651242458.033, "dur": 308.362, "args": { "External id": 20182,"Record function id": 0, "Ev Idx": 2773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242531.944, "dur": 4.265, "args": { "External id": 20183,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242542.313, "dur": 0.874, "args": { "External id": 20184,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242544.825, "dur": 0.923, "args": { "External id": 20185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242547.419, "dur": 1.126, "args": { "External id": 20186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242549.879, "dur": 0.924, "args": { "External id": 20187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242555.136, "dur": 1.033, "args": { "External id": 20188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242557.716, "dur": 1.681, "args": { "External id": 20189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242562.589, "dur": 0.647, "args": { "External id": 20190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242564.602, "dur": 0.634, "args": { "External id": 20191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651242566.690, "dur": 0.600, "args": { "External id": 20192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2783 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651242584.856, "dur": 150.764, "args": { "External id": 20193,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651242604.387, "dur": 126.452, "args": { "External id": 20194,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651242621.800, "dur": 11.890, "args": { "External id": 20195,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651242637.111, "dur": 66.410, "args": { "External id": 20196,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651242639.903, "dur": 63.327, "args": { "External id": 20197,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242644.260, "dur": 5.083, "args": { "External id": 20198,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651242651.572, "dur": 51.095, "args": { "External id": 20199,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2790 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.18", "pid": 1336759, "tid": 1381173, "ts": 1295651242839.020, "dur": 586.901, "args": { "External id": 20200,"Record function id": 0, "Ev Idx": 2791 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651242855.617, "dur": 557.968, "args": { "External id": 20201,"Record function id": 0, "Ev Idx": 2792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651242907.751, "dur": 4.648, "args": { "External id": 20202,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651242927.930, "dur": 27.233, "args": { "External id": 20203,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242932.524, "dur": 1.340, "args": { "External id": 20204,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242936.087, "dur": 0.571, "args": { "External id": 20205,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242938.245, "dur": 0.689, "args": { "External id": 20206,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242941.057, "dur": 0.282, "args": { "External id": 20207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242942.753, "dur": 0.245, "args": { "External id": 20208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242944.475, "dur": 0.254, "args": { "External id": 20209,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242946.200, "dur": 0.358, "args": { "External id": 20210,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242948.153, "dur": 0.460, "args": { "External id": 20211,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651242950.033, "dur": 0.439, "args": { "External id": 20212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651242964.789, "dur": 70.921, "args": { "External id": 20213,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2804 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651243071.046, "dur": 96.764, "args": { "External id": 20214,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651243081.963, "dur": 4.362, "args": { "External id": 20215,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651243091.249, "dur": 10.478, "args": { "External id": 20216,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651243095.340, "dur": 5.977, "args": { "External id": 20217,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243099.077, "dur": 0.615, "args": { "External id": 20218,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651243108.128, "dur": 22.097, "args": { "External id": 20219,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243110.453, "dur": 0.446, "args": { "External id": 20220,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243112.771, "dur": 0.325, "args": { "External id": 20221,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243114.577, "dur": 0.307, "args": { "External id": 20222,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243116.630, "dur": 0.272, "args": { "External id": 20223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243118.535, "dur": 0.271, "args": { "External id": 20224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243120.290, "dur": 0.289, "args": { "External id": 20225,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243122.181, "dur": 0.324, "args": { "External id": 20226,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243124.019, "dur": 0.259, "args": { "External id": 20227,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651243125.717, "dur": 0.430, "args": { "External id": 20228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651243140.059, "dur": 19.853, "args": { "External id": 20229,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2820 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651243211.686, "dur": 131.062, "args": { "External id": 20230,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2821 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651243249.625, "dur": 89.506, "args": { "External id": 20231,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2822, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651243260.869, "dur": 74.119, "args": { "External id": 20232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2823 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651243358.622, "dur": 1.773, "args": { "External id": 20233,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2824, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651243441.177, "dur": 1595.745, "args": { "External id": 20234,"Sequence number": 246580, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2825 } }, { "ph": "f", "id": 188, "pid": 1336759, "tid": 1381173, "ts": 1295651243441.177, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651243548.072, "dur": 102.596, "args": { "External id": 20235,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2826 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651243689.035, "dur": 36.474, "args": { "External id": 20236,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651243741.920, "dur": 49.752, "args": { "External id": 20237,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651243800.530, "dur": 33.387, "args": { "External id": 20238,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651243840.764, "dur": 44.645, "args": { "External id": 20239,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651243891.977, "dur": 27.044, "args": { "External id": 20240,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651243925.531, "dur": 41.654, "args": { "External id": 20241,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2832 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651244034.092, "dur": 26.404, "args": { "External id": 20242,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2833 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651244080.554, "dur": 26.734, "args": { "External id": 20243,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2834 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651244129.905, "dur": 18.325, "args": { "External id": 20244,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2835 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651244161.905, "dur": 15.635, "args": { "External id": 20245,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244187.317, "dur": 31.484, "args": { "External id": 20246,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244221.975, "dur": 52.399, "args": { "External id": 20247,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2838 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651244308.365, "dur": 177.632, "args": { "External id": 20248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651244389.678, "dur": 5.943, "args": { "External id": 20249,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651244398.016, "dur": 2.327, "args": { "External id": 20250,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2841 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651244514.216, "dur": 24.847, "args": { "External id": 20251,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2842 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651244549.870, "dur": 16.606, "args": { "External id": 20252,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244574.980, "dur": 36.934, "args": { "External id": 20253,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244617.991, "dur": 36.044, "args": { "External id": 20254,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244661.008, "dur": 19.647, "args": { "External id": 20255,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244685.128, "dur": 29.857, "args": { "External id": 20256,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244720.836, "dur": 19.188, "args": { "External id": 20257,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651244746.238, "dur": 28.683, "args": { "External id": 20258,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651244790.637, "dur": 20.260, "args": { "External id": 20259,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2850 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651244830.115, "dur": 39.890, "args": { "External id": 20260,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651244890.776, "dur": 16.373, "args": { "External id": 20261,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2852 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651244926.759, "dur": 14.165, "args": { "External id": 20262,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2853 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651244953.952, "dur": 14.971, "args": { "External id": 20263,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2854 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245081.591, "dur": 14.987, "args": { "External id": 20264,"Record function id": 0, "Ev Idx": 2855 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245084.961, "dur": 10.685, "args": { "External id": 20265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245088.978, "dur": 5.749, "args": { "External id": 20266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2857 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245090.219, "dur": 4.406, "args": { "External id": 20267,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2858 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245100.549, "dur": 4.170, "args": { "External id": 20268,"Record function id": 0, "Ev Idx": 2859 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245101.841, "dur": 2.455, "args": { "External id": 20269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245102.477, "dur": 1.344, "args": { "External id": 20270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2861 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245102.951, "dur": 0.770, "args": { "External id": 20271,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2862 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245108.154, "dur": 4.044, "args": { "External id": 20272,"Record function id": 0, "Ev Idx": 2863 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245109.391, "dur": 2.338, "args": { "External id": 20273,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245109.954, "dur": 1.318, "args": { "External id": 20274,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2865 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245110.493, "dur": 0.672, "args": { "External id": 20275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2866 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245115.346, "dur": 3.581, "args": { "External id": 20276,"Record function id": 0, "Ev Idx": 2867 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245116.422, "dur": 2.073, "args": { "External id": 20277,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245116.930, "dur": 1.127, "args": { "External id": 20278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2869 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245117.177, "dur": 0.796, "args": { "External id": 20279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2870 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245122.057, "dur": 3.707, "args": { "External id": 20280,"Record function id": 0, "Ev Idx": 2871 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245123.182, "dur": 2.133, "args": { "External id": 20281,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245123.675, "dur": 1.229, "args": { "External id": 20282,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2873 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245123.935, "dur": 0.894, "args": { "External id": 20283,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2874 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245128.830, "dur": 4.264, "args": { "External id": 20284,"Record function id": 0, "Ev Idx": 2875 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245129.869, "dur": 2.800, "args": { "External id": 20285,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245130.639, "dur": 1.632, "args": { "External id": 20286,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2877 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245131.165, "dur": 1.030, "args": { "External id": 20287,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245136.102, "dur": 3.981, "args": { "External id": 20288,"Record function id": 0, "Ev Idx": 2879 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245137.255, "dur": 2.414, "args": { "External id": 20289,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245137.829, "dur": 1.426, "args": { "External id": 20290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2881 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245138.322, "dur": 0.867, "args": { "External id": 20291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2882 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245143.103, "dur": 3.750, "args": { "External id": 20292,"Record function id": 0, "Ev Idx": 2883 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245144.056, "dur": 2.389, "args": { "External id": 20293,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245144.651, "dur": 1.374, "args": { "External id": 20294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2885 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245145.037, "dur": 0.922, "args": { "External id": 20295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2886 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245149.850, "dur": 3.448, "args": { "External id": 20296,"Record function id": 0, "Ev Idx": 2887 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651245150.787, "dur": 2.094, "args": { "External id": 20297,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245151.289, "dur": 1.177, "args": { "External id": 20298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2889 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651245151.701, "dur": 0.700, "args": { "External id": 20299,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2890 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651245156.962, "dur": 36224.496, "args": { "External id": 20300,"Record function id": 0, "Sequence number": 246579, "Fwd thread id": 1, "Ev Idx": 2891 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651245158.022, "dur": 36214.933, "args": { "External id": 20301,"Sequence number": 246579, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2892 } }, { "ph": "f", "id": 189, "pid": 1336759, "tid": 1381173, "ts": 1295651245158.022, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651245188.749, "dur": 55.425, "args": { "External id": 20302,"Record function id": 0, "Ev Idx": 2893 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651245256.161, "dur": 65.046, "args": { "External id": 20303,"Record function id": 0, "Ev Idx": 2894 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.19)", "pid": 1336759, "tid": 1381173, "ts": 1295651245330.608, "dur": 36033.867, "args": { "External id": 20304,"Record function id": 0, "Ev Idx": 2895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651245424.047, "dur": 7.637, "args": { "External id": 20305,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651245441.415, "dur": 8.454, "args": { "External id": 20306,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2897 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651245465.442, "dur": 35011.850, "args": { "External id": 20307,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651245478.733, "dur": 34990.293, "args": { "External id": 20308,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651245537.207, "dur": 14.186, "args": { "External id": 20309,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651245557.778, "dur": 34872.612, "args": { "External id": 20310,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651245560.549, "dur": 34869.076, "args": { "External id": 20311,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651245564.591, "dur": 5.332, "args": { "External id": 20312,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651245571.782, "dur": 34854.491, "args": { "External id": 20313,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651280565.114, "dur": 10.401, "args": { "External id": 20314,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651280569.274, "dur": 5.925, "args": { "External id": 20315,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651280603.484, "dur": 450.926, "args": { "External id": 20316,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651280630.667, "dur": 418.161, "args": { "External id": 20317,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2908, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651280643.598, "dur": 399.456, "args": { "External id": 20318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651281076.610, "dur": 2.272, "args": { "External id": 20319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2910, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281141.999, "dur": 6.995, "args": { "External id": 20320,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281193.376, "dur": 1.251, "args": { "External id": 20321,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281210.018, "dur": 1.138, "args": { "External id": 20322,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281223.228, "dur": 0.798, "args": { "External id": 20323,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281253.358, "dur": 1.549, "args": { "External id": 20324,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281266.228, "dur": 0.880, "args": { "External id": 20325,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281277.841, "dur": 1.044, "args": { "External id": 20326,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281289.788, "dur": 1.925, "args": { "External id": 20327,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281300.765, "dur": 0.802, "args": { "External id": 20328,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2919 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651281398.246, "dur": 2646.901, "args": { "External id": 20329,"Record function id": 0, "Ev Idx": 2920 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651281417.377, "dur": 1007.989, "args": { "External id": 20330,"Record function id": 0, "Ev Idx": 2921 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651281436.759, "dur": 303.390, "args": { "External id": 20331,"Record function id": 0, "Ev Idx": 2922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281516.300, "dur": 4.227, "args": { "External id": 20332,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281523.906, "dur": 0.912, "args": { "External id": 20333,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281526.506, "dur": 0.948, "args": { "External id": 20334,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281529.136, "dur": 0.518, "args": { "External id": 20335,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281530.886, "dur": 0.731, "args": { "External id": 20336,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281532.758, "dur": 0.554, "args": { "External id": 20337,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281534.600, "dur": 1.832, "args": { "External id": 20338,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281537.926, "dur": 0.794, "args": { "External id": 20339,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281539.809, "dur": 0.616, "args": { "External id": 20340,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651281543.982, "dur": 0.724, "args": { "External id": 20341,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2932 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651281562.540, "dur": 149.358, "args": { "External id": 20342,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651281578.252, "dur": 129.073, "args": { "External id": 20343,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651281598.514, "dur": 13.849, "args": { "External id": 20344,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651281615.508, "dur": 66.343, "args": { "External id": 20345,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651281618.102, "dur": 63.357, "args": { "External id": 20346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281622.001, "dur": 5.145, "args": { "External id": 20347,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651281628.826, "dur": 52.013, "args": { "External id": 20348,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2939 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.17", "pid": 1336759, "tid": 1381173, "ts": 1295651281814.190, "dur": 603.079, "args": { "External id": 20349,"Record function id": 0, "Ev Idx": 2940 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651281830.459, "dur": 574.121, "args": { "External id": 20350,"Record function id": 0, "Ev Idx": 2941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651281884.400, "dur": 5.151, "args": { "External id": 20351,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651281904.694, "dur": 28.845, "args": { "External id": 20352,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281909.647, "dur": 1.431, "args": { "External id": 20353,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281913.010, "dur": 0.345, "args": { "External id": 20354,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281915.085, "dur": 0.444, "args": { "External id": 20355,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281917.063, "dur": 0.437, "args": { "External id": 20356,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281919.179, "dur": 0.372, "args": { "External id": 20357,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281921.057, "dur": 0.243, "args": { "External id": 20358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281925.724, "dur": 0.345, "args": { "External id": 20359,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281927.502, "dur": 0.425, "args": { "External id": 20360,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651281929.437, "dur": 0.335, "args": { "External id": 20361,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651281942.005, "dur": 29.080, "args": { "External id": 20362,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2953 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651282047.387, "dur": 102.069, "args": { "External id": 20363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651282058.314, "dur": 5.500, "args": { "External id": 20364,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651282068.738, "dur": 10.370, "args": { "External id": 20365,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651282073.216, "dur": 5.476, "args": { "External id": 20366,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282076.304, "dur": 0.878, "args": { "External id": 20367,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651282086.302, "dur": 19.865, "args": { "External id": 20368,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282088.685, "dur": 0.524, "args": { "External id": 20369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282090.912, "dur": 0.496, "args": { "External id": 20370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282092.610, "dur": 0.386, "args": { "External id": 20371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282094.281, "dur": 0.252, "args": { "External id": 20372,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282095.903, "dur": 0.360, "args": { "External id": 20373,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282097.427, "dur": 0.440, "args": { "External id": 20374,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282098.954, "dur": 0.264, "args": { "External id": 20375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282100.494, "dur": 0.307, "args": { "External id": 20376,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651282102.300, "dur": 0.261, "args": { "External id": 20377,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651282120.462, "dur": 20.935, "args": { "External id": 20378,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2969 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651282194.017, "dur": 135.087, "args": { "External id": 20379,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2970 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651282222.156, "dur": 103.147, "args": { "External id": 20380,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2971, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651282247.981, "dur": 73.063, "args": { "External id": 20381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2972 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651282349.146, "dur": 1.507, "args": { "External id": 20382,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2973, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651282432.688, "dur": 1551.130, "args": { "External id": 20383,"Sequence number": 246578, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2974 } }, { "ph": "f", "id": 190, "pid": 1336759, "tid": 1381173, "ts": 1295651282432.688, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651282536.817, "dur": 102.547, "args": { "External id": 20384,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2975 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651282677.007, "dur": 35.913, "args": { "External id": 20385,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651282729.158, "dur": 49.158, "args": { "External id": 20386,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651282787.637, "dur": 31.274, "args": { "External id": 20387,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651282824.898, "dur": 44.842, "args": { "External id": 20388,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651282876.635, "dur": 27.113, "args": { "External id": 20389,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651282910.683, "dur": 41.468, "args": { "External id": 20390,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2981 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651282976.226, "dur": 63.569, "args": { "External id": 20391,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2982 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651283063.446, "dur": 26.349, "args": { "External id": 20392,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2983 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651283113.377, "dur": 18.496, "args": { "External id": 20393,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2984 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651283146.546, "dur": 14.595, "args": { "External id": 20394,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283172.537, "dur": 32.288, "args": { "External id": 20395,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283208.140, "dur": 49.564, "args": { "External id": 20396,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2987 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651283285.929, "dur": 175.702, "args": { "External id": 20397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651283369.654, "dur": 5.824, "args": { "External id": 20398,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651283377.538, "dur": 1.945, "args": { "External id": 20399,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2990 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651283492.539, "dur": 25.085, "args": { "External id": 20400,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2991 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651283529.064, "dur": 14.368, "args": { "External id": 20401,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283551.974, "dur": 39.018, "args": { "External id": 20402,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283597.106, "dur": 35.729, "args": { "External id": 20403,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283639.693, "dur": 20.146, "args": { "External id": 20404,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283666.906, "dur": 29.340, "args": { "External id": 20405,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283701.818, "dur": 25.804, "args": { "External id": 20406,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651283733.475, "dur": 29.099, "args": { "External id": 20407,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2998 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651283778.912, "dur": 21.689, "args": { "External id": 20408,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2999 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651283816.914, "dur": 22.278, "args": { "External id": 20409,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3000 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651283870.289, "dur": 22.278, "args": { "External id": 20410,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3001 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651283910.878, "dur": 14.593, "args": { "External id": 20411,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3002 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651283938.403, "dur": 15.289, "args": { "External id": 20412,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3003 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284069.179, "dur": 15.556, "args": { "External id": 20413,"Record function id": 0, "Ev Idx": 3004 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284072.936, "dur": 10.777, "args": { "External id": 20414,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284077.205, "dur": 5.584, "args": { "External id": 20415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3006 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284078.443, "dur": 4.220, "args": { "External id": 20416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3007 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284091.834, "dur": 4.373, "args": { "External id": 20417,"Record function id": 0, "Ev Idx": 3008 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284093.073, "dur": 2.596, "args": { "External id": 20418,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284093.755, "dur": 1.444, "args": { "External id": 20419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3010 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284094.278, "dur": 0.848, "args": { "External id": 20420,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3011 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284099.354, "dur": 4.225, "args": { "External id": 20421,"Record function id": 0, "Ev Idx": 3012 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284100.452, "dur": 2.684, "args": { "External id": 20422,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284101.346, "dur": 1.376, "args": { "External id": 20423,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3014 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284101.940, "dur": 0.687, "args": { "External id": 20424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3015 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284106.798, "dur": 3.441, "args": { "External id": 20425,"Record function id": 0, "Ev Idx": 3016 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284107.816, "dur": 2.014, "args": { "External id": 20426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284108.322, "dur": 1.118, "args": { "External id": 20427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3018 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284108.626, "dur": 0.674, "args": { "External id": 20428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3019 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284113.439, "dur": 3.962, "args": { "External id": 20429,"Record function id": 0, "Ev Idx": 3020 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284114.626, "dur": 2.321, "args": { "External id": 20430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284115.199, "dur": 1.344, "args": { "External id": 20431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3022 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284115.625, "dur": 0.832, "args": { "External id": 20432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3023 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284120.404, "dur": 3.443, "args": { "External id": 20433,"Record function id": 0, "Ev Idx": 3024 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284121.253, "dur": 2.178, "args": { "External id": 20434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284121.738, "dur": 1.302, "args": { "External id": 20435,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3026 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284122.276, "dur": 0.671, "args": { "External id": 20436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3027 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284126.906, "dur": 3.356, "args": { "External id": 20437,"Record function id": 0, "Ev Idx": 3028 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284127.975, "dur": 1.865, "args": { "External id": 20438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284128.470, "dur": 0.963, "args": { "External id": 20439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3030 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284128.766, "dur": 0.600, "args": { "External id": 20440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3031 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284133.259, "dur": 3.528, "args": { "External id": 20441,"Record function id": 0, "Ev Idx": 3032 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284134.352, "dur": 2.020, "args": { "External id": 20442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284134.899, "dur": 1.069, "args": { "External id": 20443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3034 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284135.195, "dur": 0.704, "args": { "External id": 20444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284139.714, "dur": 3.751, "args": { "External id": 20445,"Record function id": 0, "Ev Idx": 3036 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651284140.886, "dur": 2.130, "args": { "External id": 20446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284141.381, "dur": 1.124, "args": { "External id": 20447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3038 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651284141.690, "dur": 0.748, "args": { "External id": 20448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3039 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651284149.789, "dur": 36307.255, "args": { "External id": 20449,"Record function id": 0, "Sequence number": 246577, "Fwd thread id": 1, "Ev Idx": 3040 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651284150.865, "dur": 36297.735, "args": { "External id": 20450,"Sequence number": 246577, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3041 } }, { "ph": "f", "id": 191, "pid": 1336759, "tid": 1381173, "ts": 1295651284150.865, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651284182.825, "dur": 41.195, "args": { "External id": 20451,"Record function id": 0, "Ev Idx": 3042 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651284249.265, "dur": 65.872, "args": { "External id": 20452,"Record function id": 0, "Ev Idx": 3043 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.18)", "pid": 1336759, "tid": 1381173, "ts": 1295651284321.313, "dur": 36118.987, "args": { "External id": 20453,"Record function id": 0, "Ev Idx": 3044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651284414.607, "dur": 6.811, "args": { "External id": 20454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651284431.317, "dur": 4.984, "args": { "External id": 20455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3046 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651284451.578, "dur": 35073.770, "args": { "External id": 20456,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651284474.774, "dur": 35040.969, "args": { "External id": 20457,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651284527.317, "dur": 13.405, "args": { "External id": 20458,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651284547.025, "dur": 34932.177, "args": { "External id": 20459,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651284549.902, "dur": 34928.556, "args": { "External id": 20460,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651284554.002, "dur": 5.663, "args": { "External id": 20461,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651284561.426, "dur": 34913.442, "args": { "External id": 20462,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651319615.868, "dur": 8.980, "args": { "External id": 20463,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651319618.740, "dur": 5.748, "args": { "External id": 20464,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651319652.446, "dur": 479.614, "args": { "External id": 20465,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651319684.832, "dur": 441.087, "args": { "External id": 20466,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3057, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651319696.046, "dur": 423.363, "args": { "External id": 20467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651320159.272, "dur": 2.655, "args": { "External id": 20468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3059, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320226.748, "dur": 21.395, "args": { "External id": 20469,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320294.234, "dur": 1.509, "args": { "External id": 20470,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320311.296, "dur": 1.334, "args": { "External id": 20471,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320324.406, "dur": 0.741, "args": { "External id": 20472,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320336.899, "dur": 0.821, "args": { "External id": 20473,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320347.616, "dur": 0.874, "args": { "External id": 20474,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320357.536, "dur": 0.803, "args": { "External id": 20475,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320367.741, "dur": 1.877, "args": { "External id": 20476,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320378.557, "dur": 0.746, "args": { "External id": 20477,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3068 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651320472.433, "dur": 2668.098, "args": { "External id": 20478,"Record function id": 0, "Ev Idx": 3069 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651320492.997, "dur": 1022.511, "args": { "External id": 20479,"Record function id": 0, "Ev Idx": 3070 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651320511.553, "dur": 320.202, "args": { "External id": 20480,"Record function id": 0, "Ev Idx": 3071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320614.253, "dur": 4.297, "args": { "External id": 20481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320621.852, "dur": 0.726, "args": { "External id": 20482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320624.159, "dur": 0.677, "args": { "External id": 20483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320628.263, "dur": 0.543, "args": { "External id": 20484,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320629.990, "dur": 0.646, "args": { "External id": 20485,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320631.732, "dur": 0.551, "args": { "External id": 20486,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320633.459, "dur": 1.537, "args": { "External id": 20487,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320638.309, "dur": 0.753, "args": { "External id": 20488,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320640.301, "dur": 0.689, "args": { "External id": 20489,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651320642.056, "dur": 0.999, "args": { "External id": 20490,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3081 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651320661.318, "dur": 141.855, "args": { "External id": 20491,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651320677.848, "dur": 120.990, "args": { "External id": 20492,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651320693.813, "dur": 12.543, "args": { "External id": 20493,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651320709.190, "dur": 64.476, "args": { "External id": 20494,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651320711.479, "dur": 61.856, "args": { "External id": 20495,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651320715.431, "dur": 5.160, "args": { "External id": 20496,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651320722.190, "dur": 50.620, "args": { "External id": 20497,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3088 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.16", "pid": 1336759, "tid": 1381173, "ts": 1295651320906.321, "dur": 600.733, "args": { "External id": 20498,"Record function id": 0, "Ev Idx": 3089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651320922.220, "dur": 571.720, "args": { "External id": 20499,"Record function id": 0, "Ev Idx": 3090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651320975.958, "dur": 43.657, "args": { "External id": 20500,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651321038.952, "dur": 24.230, "args": { "External id": 20501,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321043.956, "dur": 1.704, "args": { "External id": 20502,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321047.485, "dur": 0.319, "args": { "External id": 20503,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321049.269, "dur": 0.469, "args": { "External id": 20504,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321050.880, "dur": 0.392, "args": { "External id": 20505,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321052.346, "dur": 0.260, "args": { "External id": 20506,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321053.631, "dur": 0.399, "args": { "External id": 20507,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321055.158, "dur": 0.281, "args": { "External id": 20508,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321056.586, "dur": 0.548, "args": { "External id": 20509,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321058.295, "dur": 0.288, "args": { "External id": 20510,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651321072.606, "dur": 34.567, "args": { "External id": 20511,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3102 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651321138.375, "dur": 110.541, "args": { "External id": 20512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651321148.367, "dur": 4.406, "args": { "External id": 20513,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651321157.682, "dur": 10.544, "args": { "External id": 20514,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651321161.865, "dur": 5.908, "args": { "External id": 20515,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321165.419, "dur": 1.109, "args": { "External id": 20516,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651321174.699, "dur": 19.295, "args": { "External id": 20517,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321176.920, "dur": 0.290, "args": { "External id": 20518,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321178.405, "dur": 0.618, "args": { "External id": 20519,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321180.196, "dur": 0.316, "args": { "External id": 20520,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321181.572, "dur": 0.302, "args": { "External id": 20521,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321183.111, "dur": 0.454, "args": { "External id": 20522,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321184.835, "dur": 0.417, "args": { "External id": 20523,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321186.656, "dur": 0.403, "args": { "External id": 20524,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321188.151, "dur": 0.402, "args": { "External id": 20525,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651321189.865, "dur": 0.177, "args": { "External id": 20526,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651321206.560, "dur": 19.049, "args": { "External id": 20527,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3118 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651321298.627, "dur": 123.604, "args": { "External id": 20528,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3119 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651321330.770, "dur": 87.902, "args": { "External id": 20529,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3120, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651321340.898, "dur": 73.370, "args": { "External id": 20530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3121 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651321439.817, "dur": 2.042, "args": { "External id": 20531,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3122, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651321522.915, "dur": 1597.908, "args": { "External id": 20532,"Sequence number": 246576, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3123 } }, { "ph": "f", "id": 192, "pid": 1336759, "tid": 1381173, "ts": 1295651321522.915, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651321629.176, "dur": 102.837, "args": { "External id": 20533,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3124 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651321770.819, "dur": 35.912, "args": { "External id": 20534,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651321822.142, "dur": 47.044, "args": { "External id": 20535,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651321878.592, "dur": 32.084, "args": { "External id": 20536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651321917.160, "dur": 44.748, "args": { "External id": 20537,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651321968.160, "dur": 68.705, "args": { "External id": 20538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322048.439, "dur": 53.528, "args": { "External id": 20539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3130 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651322130.511, "dur": 23.482, "args": { "External id": 20540,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3131 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651322177.485, "dur": 26.174, "args": { "External id": 20541,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3132 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651322242.553, "dur": 21.439, "args": { "External id": 20542,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3133 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651322285.780, "dur": 14.982, "args": { "External id": 20543,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322310.130, "dur": 32.075, "args": { "External id": 20544,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322345.813, "dur": 32.759, "args": { "External id": 20545,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3136 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651322403.282, "dur": 167.827, "args": { "External id": 20546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651322482.945, "dur": 5.720, "args": { "External id": 20547,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651322490.408, "dur": 2.103, "args": { "External id": 20548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3139 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651322599.102, "dur": 22.423, "args": { "External id": 20549,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3140 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651322639.885, "dur": 13.754, "args": { "External id": 20550,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322661.601, "dur": 31.474, "args": { "External id": 20551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322698.650, "dur": 32.718, "args": { "External id": 20552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322737.712, "dur": 20.257, "args": { "External id": 20553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322762.322, "dur": 30.456, "args": { "External id": 20554,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322798.263, "dur": 19.970, "args": { "External id": 20555,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651322823.469, "dur": 28.502, "args": { "External id": 20556,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3147 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651322871.401, "dur": 21.281, "args": { "External id": 20557,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3148 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651322919.088, "dur": 29.719, "args": { "External id": 20558,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3149 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651322967.818, "dur": 50.985, "args": { "External id": 20559,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3150 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651323043.516, "dur": 16.307, "args": { "External id": 20560,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3151 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651323073.708, "dur": 15.536, "args": { "External id": 20561,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323166.485, "dur": 15.001, "args": { "External id": 20562,"Record function id": 0, "Ev Idx": 3153 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323169.554, "dur": 10.939, "args": { "External id": 20563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323174.102, "dur": 5.486, "args": { "External id": 20564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3155 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323175.582, "dur": 3.884, "args": { "External id": 20565,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323185.365, "dur": 4.433, "args": { "External id": 20566,"Record function id": 0, "Ev Idx": 3157 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323186.682, "dur": 2.689, "args": { "External id": 20567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323187.404, "dur": 1.501, "args": { "External id": 20568,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3159 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323187.996, "dur": 0.796, "args": { "External id": 20569,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3160 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323193.084, "dur": 3.784, "args": { "External id": 20570,"Record function id": 0, "Ev Idx": 3161 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323194.325, "dur": 2.110, "args": { "External id": 20571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323194.813, "dur": 1.196, "args": { "External id": 20572,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3163 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323195.407, "dur": 0.498, "args": { "External id": 20573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3164 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323200.086, "dur": 4.028, "args": { "External id": 20574,"Record function id": 0, "Ev Idx": 3165 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323201.210, "dur": 2.489, "args": { "External id": 20575,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323201.687, "dur": 1.601, "args": { "External id": 20576,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3167 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323201.964, "dur": 1.215, "args": { "External id": 20577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3168 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323210.075, "dur": 3.827, "args": { "External id": 20578,"Record function id": 0, "Ev Idx": 3169 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323210.999, "dur": 2.487, "args": { "External id": 20579,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323211.561, "dur": 1.511, "args": { "External id": 20580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3171 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323212.050, "dur": 0.918, "args": { "External id": 20581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3172 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323216.919, "dur": 3.780, "args": { "External id": 20582,"Record function id": 0, "Ev Idx": 3173 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323217.856, "dur": 2.398, "args": { "External id": 20583,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323218.459, "dur": 1.378, "args": { "External id": 20584,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3175 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323218.908, "dur": 0.839, "args": { "External id": 20585,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323223.861, "dur": 19.741, "args": { "External id": 20586,"Record function id": 0, "Ev Idx": 3177 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323224.944, "dur": 2.530, "args": { "External id": 20587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323225.399, "dur": 1.645, "args": { "External id": 20588,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3179 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323225.659, "dur": 1.322, "args": { "External id": 20589,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323249.882, "dur": 6.233, "args": { "External id": 20590,"Record function id": 0, "Ev Idx": 3181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323251.341, "dur": 4.294, "args": { "External id": 20591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323252.484, "dur": 2.342, "args": { "External id": 20592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323253.093, "dur": 1.659, "args": { "External id": 20593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323259.268, "dur": 4.347, "args": { "External id": 20594,"Record function id": 0, "Ev Idx": 3185 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651323260.354, "dur": 2.865, "args": { "External id": 20595,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323260.909, "dur": 1.868, "args": { "External id": 20596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3187 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651323261.552, "dur": 1.156, "args": { "External id": 20597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651323267.228, "dur": 36213.258, "args": { "External id": 20598,"Record function id": 0, "Sequence number": 246575, "Fwd thread id": 1, "Ev Idx": 3189 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651323268.464, "dur": 36203.274, "args": { "External id": 20599,"Sequence number": 246575, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3190 } }, { "ph": "f", "id": 193, "pid": 1336759, "tid": 1381173, "ts": 1295651323268.464, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651323297.090, "dur": 37.579, "args": { "External id": 20600,"Record function id": 0, "Ev Idx": 3191 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651323342.110, "dur": 57.929, "args": { "External id": 20601,"Record function id": 0, "Ev Idx": 3192 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.17)", "pid": 1336759, "tid": 1381173, "ts": 1295651323405.726, "dur": 36057.511, "args": { "External id": 20602,"Record function id": 0, "Ev Idx": 3193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651323493.275, "dur": 10.679, "args": { "External id": 20603,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651323513.830, "dur": 5.025, "args": { "External id": 20604,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3195 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651323532.646, "dur": 35131.564, "args": { "External id": 20605,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651323545.548, "dur": 35109.479, "args": { "External id": 20606,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651323602.283, "dur": 16.842, "args": { "External id": 20607,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651323625.394, "dur": 34989.460, "args": { "External id": 20608,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651323628.288, "dur": 34985.811, "args": { "External id": 20609,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651323632.473, "dur": 5.230, "args": { "External id": 20610,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651323639.399, "dur": 34970.815, "args": { "External id": 20611,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651358754.116, "dur": 9.777, "args": { "External id": 20612,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651358756.912, "dur": 6.536, "args": { "External id": 20613,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651358792.435, "dur": 371.004, "args": { "External id": 20614,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651358823.460, "dur": 334.619, "args": { "External id": 20615,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3206, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651358834.576, "dur": 317.348, "args": { "External id": 20616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651359187.210, "dur": 2.189, "args": { "External id": 20617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3208, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359266.010, "dur": 7.063, "args": { "External id": 20618,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359317.305, "dur": 1.366, "args": { "External id": 20619,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359333.248, "dur": 1.535, "args": { "External id": 20620,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359346.558, "dur": 1.041, "args": { "External id": 20621,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359359.447, "dur": 1.288, "args": { "External id": 20622,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359370.392, "dur": 1.232, "args": { "External id": 20623,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359381.548, "dur": 1.005, "args": { "External id": 20624,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359392.187, "dur": 1.236, "args": { "External id": 20625,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359402.441, "dur": 1.089, "args": { "External id": 20626,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651359499.332, "dur": 2645.622, "args": { "External id": 20627,"Record function id": 0, "Ev Idx": 3218 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651359518.033, "dur": 996.782, "args": { "External id": 20628,"Record function id": 0, "Ev Idx": 3219 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651359532.694, "dur": 303.415, "args": { "External id": 20629,"Record function id": 0, "Ev Idx": 3220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359606.838, "dur": 5.195, "args": { "External id": 20630,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359617.190, "dur": 1.130, "args": { "External id": 20631,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359620.142, "dur": 1.025, "args": { "External id": 20632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359623.092, "dur": 1.624, "args": { "External id": 20633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359626.345, "dur": 1.467, "args": { "External id": 20634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359631.021, "dur": 1.479, "args": { "External id": 20635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359634.291, "dur": 1.386, "args": { "External id": 20636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359637.213, "dur": 1.255, "args": { "External id": 20637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359640.144, "dur": 1.492, "args": { "External id": 20638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651359644.927, "dur": 1.241, "args": { "External id": 20639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3230 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651359664.500, "dur": 144.700, "args": { "External id": 20640,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651359680.150, "dur": 125.233, "args": { "External id": 20641,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651359699.892, "dur": 12.348, "args": { "External id": 20642,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651359715.486, "dur": 63.824, "args": { "External id": 20643,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651359718.068, "dur": 60.877, "args": { "External id": 20644,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651359721.693, "dur": 5.502, "args": { "External id": 20645,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651359728.997, "dur": 49.278, "args": { "External id": 20646,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3237 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.15", "pid": 1336759, "tid": 1381173, "ts": 1295651359908.276, "dur": 598.635, "args": { "External id": 20647,"Record function id": 0, "Ev Idx": 3238 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651359923.636, "dur": 570.855, "args": { "External id": 20648,"Record function id": 0, "Ev Idx": 3239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651359974.799, "dur": 4.696, "args": { "External id": 20649,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651360034.738, "dur": 26.802, "args": { "External id": 20650,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360039.784, "dur": 2.922, "args": { "External id": 20651,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360044.347, "dur": 0.362, "args": { "External id": 20652,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360045.582, "dur": 0.680, "args": { "External id": 20653,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360048.104, "dur": 0.778, "args": { "External id": 20654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360049.977, "dur": 0.676, "args": { "External id": 20655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360051.691, "dur": 0.678, "args": { "External id": 20656,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360054.030, "dur": 0.567, "args": { "External id": 20657,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360055.677, "dur": 0.809, "args": { "External id": 20658,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360057.293, "dur": 0.714, "args": { "External id": 20659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651360071.669, "dur": 33.364, "args": { "External id": 20660,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3251 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651360137.258, "dur": 122.111, "args": { "External id": 20661,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651360147.748, "dur": 4.857, "args": { "External id": 20662,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651360157.579, "dur": 13.689, "args": { "External id": 20663,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651360163.947, "dur": 6.881, "args": { "External id": 20664,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360168.081, "dur": 0.996, "args": { "External id": 20665,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651360178.496, "dur": 25.797, "args": { "External id": 20666,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360180.751, "dur": 0.771, "args": { "External id": 20667,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360183.312, "dur": 0.456, "args": { "External id": 20668,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360185.267, "dur": 0.792, "args": { "External id": 20669,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360187.551, "dur": 0.596, "args": { "External id": 20670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360189.038, "dur": 0.671, "args": { "External id": 20671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360191.062, "dur": 0.792, "args": { "External id": 20672,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360193.308, "dur": 0.696, "args": { "External id": 20673,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360195.347, "dur": 0.535, "args": { "External id": 20674,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651360197.250, "dur": 0.588, "args": { "External id": 20675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651360214.965, "dur": 35.074, "args": { "External id": 20676,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3267 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651360306.147, "dur": 118.437, "args": { "External id": 20677,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3268 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651360335.335, "dur": 85.868, "args": { "External id": 20678,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3269, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651360345.354, "dur": 71.576, "args": { "External id": 20679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3270 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651360442.316, "dur": 1.643, "args": { "External id": 20680,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3271, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651360521.515, "dur": 1603.148, "args": { "External id": 20681,"Sequence number": 246574, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3272 } }, { "ph": "f", "id": 194, "pid": 1336759, "tid": 1381173, "ts": 1295651360521.515, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651360626.504, "dur": 102.548, "args": { "External id": 20682,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3273 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651360767.869, "dur": 36.033, "args": { "External id": 20683,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651360818.918, "dur": 47.046, "args": { "External id": 20684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651360875.055, "dur": 31.673, "args": { "External id": 20685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651360913.241, "dur": 44.568, "args": { "External id": 20686,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651360975.039, "dur": 71.230, "args": { "External id": 20687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361059.036, "dur": 44.568, "args": { "External id": 20688,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3279 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651361135.436, "dur": 21.905, "args": { "External id": 20689,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3280 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651361179.773, "dur": 25.785, "args": { "External id": 20690,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3281 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651361226.767, "dur": 36.200, "args": { "External id": 20691,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3282 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651361279.020, "dur": 14.958, "args": { "External id": 20692,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361304.006, "dur": 31.478, "args": { "External id": 20693,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361339.192, "dur": 32.802, "args": { "External id": 20694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3285 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651361399.203, "dur": 163.528, "args": { "External id": 20695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651361475.167, "dur": 5.796, "args": { "External id": 20696,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651361483.126, "dur": 2.397, "args": { "External id": 20697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3288 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651361594.408, "dur": 22.412, "args": { "External id": 20698,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3289 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651361630.472, "dur": 13.429, "args": { "External id": 20699,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361651.208, "dur": 31.884, "args": { "External id": 20700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361688.883, "dur": 32.514, "args": { "External id": 20701,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361728.131, "dur": 20.340, "args": { "External id": 20702,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361752.987, "dur": 32.279, "args": { "External id": 20703,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361791.216, "dur": 19.288, "args": { "External id": 20704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651361820.830, "dur": 28.425, "args": { "External id": 20705,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651361868.024, "dur": 23.254, "args": { "External id": 20706,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3297 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651361908.038, "dur": 22.197, "args": { "External id": 20707,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651361950.492, "dur": 16.228, "args": { "External id": 20708,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3299 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651361981.686, "dur": 66.507, "args": { "External id": 20709,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3300 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651362075.668, "dur": 18.407, "args": { "External id": 20710,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3301 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362170.787, "dur": 15.674, "args": { "External id": 20711,"Record function id": 0, "Ev Idx": 3302 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362174.139, "dur": 11.281, "args": { "External id": 20712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362178.455, "dur": 6.010, "args": { "External id": 20713,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3304 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362179.888, "dur": 4.489, "args": { "External id": 20714,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3305 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362190.226, "dur": 4.841, "args": { "External id": 20715,"Record function id": 0, "Ev Idx": 3306 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362191.862, "dur": 2.757, "args": { "External id": 20716,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362192.797, "dur": 1.384, "args": { "External id": 20717,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3308 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362193.234, "dur": 0.877, "args": { "External id": 20718,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3309 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362198.400, "dur": 4.227, "args": { "External id": 20719,"Record function id": 0, "Ev Idx": 3310 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362199.585, "dur": 2.601, "args": { "External id": 20720,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362200.121, "dur": 1.643, "args": { "External id": 20721,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3312 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362200.916, "dur": 0.755, "args": { "External id": 20722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3313 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362205.901, "dur": 4.293, "args": { "External id": 20723,"Record function id": 0, "Ev Idx": 3314 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362207.253, "dur": 2.502, "args": { "External id": 20724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362207.963, "dur": 1.389, "args": { "External id": 20725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3316 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362208.460, "dur": 0.817, "args": { "External id": 20726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3317 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362213.295, "dur": 4.031, "args": { "External id": 20727,"Record function id": 0, "Ev Idx": 3318 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362214.532, "dur": 2.360, "args": { "External id": 20728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362215.037, "dur": 1.416, "args": { "External id": 20729,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3320 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362215.479, "dur": 0.900, "args": { "External id": 20730,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3321 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362223.812, "dur": 3.713, "args": { "External id": 20731,"Record function id": 0, "Ev Idx": 3322 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362224.763, "dur": 2.341, "args": { "External id": 20732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362225.198, "dur": 1.498, "args": { "External id": 20733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3324 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362225.825, "dur": 0.796, "args": { "External id": 20734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3325 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362249.113, "dur": 6.505, "args": { "External id": 20735,"Record function id": 0, "Ev Idx": 3326 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362250.811, "dur": 4.110, "args": { "External id": 20736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362251.892, "dur": 2.219, "args": { "External id": 20737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3328 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362252.345, "dur": 1.613, "args": { "External id": 20738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362258.812, "dur": 4.409, "args": { "External id": 20739,"Record function id": 0, "Ev Idx": 3330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362259.724, "dur": 3.081, "args": { "External id": 20740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362260.425, "dur": 1.929, "args": { "External id": 20741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362260.810, "dur": 1.471, "args": { "External id": 20742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362266.612, "dur": 6.822, "args": { "External id": 20743,"Record function id": 0, "Ev Idx": 3334 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651362268.035, "dur": 4.994, "args": { "External id": 20744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362268.719, "dur": 3.786, "args": { "External id": 20745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3336 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651362271.190, "dur": 1.216, "args": { "External id": 20746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651362277.249, "dur": 36915.661, "args": { "External id": 20747,"Record function id": 0, "Sequence number": 246573, "Fwd thread id": 1, "Ev Idx": 3338 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651362278.418, "dur": 36906.475, "args": { "External id": 20748,"Sequence number": 246573, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3339 } }, { "ph": "f", "id": 195, "pid": 1336759, "tid": 1381173, "ts": 1295651362278.418, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651362311.475, "dur": 41.464, "args": { "External id": 20749,"Record function id": 0, "Ev Idx": 3340 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651362361.056, "dur": 60.914, "args": { "External id": 20750,"Record function id": 0, "Ev Idx": 3341 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.16)", "pid": 1336759, "tid": 1381173, "ts": 1295651362427.779, "dur": 36748.415, "args": { "External id": 20751,"Record function id": 0, "Ev Idx": 3342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651362514.294, "dur": 6.835, "args": { "External id": 20752,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651362530.679, "dur": 4.953, "args": { "External id": 20753,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3344 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651362549.705, "dur": 35653.659, "args": { "External id": 20754,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651362563.453, "dur": 35630.981, "args": { "External id": 20755,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651362614.496, "dur": 14.243, "args": { "External id": 20756,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651362635.118, "dur": 35524.136, "args": { "External id": 20757,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651362637.664, "dur": 35521.017, "args": { "External id": 20758,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651362641.920, "dur": 5.653, "args": { "External id": 20759,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651362649.285, "dur": 35505.751, "args": { "External id": 20760,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651398305.485, "dur": 8.814, "args": { "External id": 20761,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651398308.377, "dur": 5.376, "args": { "External id": 20762,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651398342.124, "dur": 480.487, "args": { "External id": 20763,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651398373.350, "dur": 443.919, "args": { "External id": 20764,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3355, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651398384.177, "dur": 426.196, "args": { "External id": 20765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651398855.041, "dur": 2.467, "args": { "External id": 20766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3357, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651398925.699, "dur": 7.355, "args": { "External id": 20767,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399016.541, "dur": 2.557, "args": { "External id": 20768,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399039.583, "dur": 1.362, "args": { "External id": 20769,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399052.451, "dur": 1.636, "args": { "External id": 20770,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399063.531, "dur": 1.309, "args": { "External id": 20771,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399074.450, "dur": 1.063, "args": { "External id": 20772,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399084.568, "dur": 1.069, "args": { "External id": 20773,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399095.682, "dur": 1.550, "args": { "External id": 20774,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399108.125, "dur": 1.889, "args": { "External id": 20775,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3366 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651399209.557, "dur": 2628.947, "args": { "External id": 20776,"Record function id": 0, "Ev Idx": 3367 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651399243.728, "dur": 981.617, "args": { "External id": 20777,"Record function id": 0, "Ev Idx": 3368 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651399261.203, "dur": 312.897, "args": { "External id": 20778,"Record function id": 0, "Ev Idx": 3369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399342.095, "dur": 5.619, "args": { "External id": 20779,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399351.255, "dur": 1.497, "args": { "External id": 20780,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399354.380, "dur": 1.256, "args": { "External id": 20781,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399357.210, "dur": 0.727, "args": { "External id": 20782,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399361.238, "dur": 1.760, "args": { "External id": 20783,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399364.496, "dur": 1.345, "args": { "External id": 20784,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399367.393, "dur": 1.347, "args": { "External id": 20785,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399369.985, "dur": 0.931, "args": { "External id": 20786,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399373.859, "dur": 1.354, "args": { "External id": 20787,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651399376.478, "dur": 1.369, "args": { "External id": 20788,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3379 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651399396.480, "dur": 148.238, "args": { "External id": 20789,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651399411.654, "dur": 128.486, "args": { "External id": 20790,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651399429.909, "dur": 13.764, "args": { "External id": 20791,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651399446.537, "dur": 66.238, "args": { "External id": 20792,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651399448.995, "dur": 63.456, "args": { "External id": 20793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399452.417, "dur": 5.204, "args": { "External id": 20794,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651399461.102, "dur": 50.517, "args": { "External id": 20795,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3386 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.14", "pid": 1336759, "tid": 1381173, "ts": 1295651399652.192, "dur": 565.268, "args": { "External id": 20796,"Record function id": 0, "Ev Idx": 3387 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651399667.878, "dur": 536.013, "args": { "External id": 20797,"Record function id": 0, "Ev Idx": 3388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651399720.405, "dur": 4.948, "args": { "External id": 20798,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651399741.451, "dur": 25.688, "args": { "External id": 20799,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399746.213, "dur": 1.912, "args": { "External id": 20800,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399750.160, "dur": 0.285, "args": { "External id": 20801,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399751.591, "dur": 0.494, "args": { "External id": 20802,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399753.196, "dur": 0.783, "args": { "External id": 20803,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399754.830, "dur": 0.938, "args": { "External id": 20804,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399757.094, "dur": 0.379, "args": { "External id": 20805,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399758.120, "dur": 1.091, "args": { "External id": 20806,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399760.523, "dur": 0.665, "args": { "External id": 20807,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399762.166, "dur": 1.019, "args": { "External id": 20808,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651399776.419, "dur": 28.227, "args": { "External id": 20809,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3400 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651399834.921, "dur": 94.313, "args": { "External id": 20810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651399844.101, "dur": 3.256, "args": { "External id": 20811,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651399852.368, "dur": 11.353, "args": { "External id": 20812,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651399856.625, "dur": 6.627, "args": { "External id": 20813,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399860.479, "dur": 1.086, "args": { "External id": 20814,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651399870.452, "dur": 24.429, "args": { "External id": 20815,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399871.959, "dur": 0.398, "args": { "External id": 20816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399873.625, "dur": 0.877, "args": { "External id": 20817,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399875.560, "dur": 0.827, "args": { "External id": 20818,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399877.678, "dur": 0.731, "args": { "External id": 20819,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399879.430, "dur": 0.692, "args": { "External id": 20820,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399881.012, "dur": 0.780, "args": { "External id": 20821,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399882.654, "dur": 0.981, "args": { "External id": 20822,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399884.601, "dur": 0.829, "args": { "External id": 20823,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651399886.750, "dur": 0.664, "args": { "External id": 20824,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651399904.580, "dur": 17.855, "args": { "External id": 20825,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3416 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651399969.494, "dur": 159.201, "args": { "External id": 20826,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3417 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651400037.514, "dur": 87.509, "args": { "External id": 20827,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3418, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651400048.169, "dur": 72.856, "args": { "External id": 20828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3419 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651400146.188, "dur": 1.933, "args": { "External id": 20829,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3420, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651400248.094, "dur": 1570.970, "args": { "External id": 20830,"Sequence number": 246572, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3421 } }, { "ph": "f", "id": 196, "pid": 1336759, "tid": 1381173, "ts": 1295651400248.094, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400360.126, "dur": 105.349, "args": { "External id": 20831,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3422 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651400508.095, "dur": 36.956, "args": { "External id": 20832,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651400563.292, "dur": 47.462, "args": { "External id": 20833,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400620.150, "dur": 36.980, "args": { "External id": 20834,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400663.846, "dur": 44.227, "args": { "External id": 20835,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400714.790, "dur": 26.994, "args": { "External id": 20836,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400749.393, "dur": 40.708, "args": { "External id": 20837,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3428 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651400816.147, "dur": 21.324, "args": { "External id": 20838,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3429 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651400856.955, "dur": 27.539, "args": { "External id": 20839,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3430 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651400906.014, "dur": 18.335, "args": { "External id": 20840,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3431 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651400938.029, "dur": 14.928, "args": { "External id": 20841,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651400962.407, "dur": 66.555, "args": { "External id": 20842,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401034.568, "dur": 36.260, "args": { "External id": 20843,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3434 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651401108.174, "dur": 182.261, "args": { "External id": 20844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651401186.955, "dur": 5.719, "args": { "External id": 20845,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651401194.609, "dur": 2.555, "args": { "External id": 20846,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3437 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651401323.009, "dur": 25.434, "args": { "External id": 20847,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3438 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651401361.379, "dur": 15.106, "args": { "External id": 20848,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401386.212, "dur": 41.504, "args": { "External id": 20849,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401434.856, "dur": 34.765, "args": { "External id": 20850,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401476.877, "dur": 19.462, "args": { "External id": 20851,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401501.026, "dur": 29.263, "args": { "External id": 20852,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401536.097, "dur": 19.019, "args": { "External id": 20853,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651401560.581, "dur": 28.500, "args": { "External id": 20854,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3445 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651401623.843, "dur": 26.885, "args": { "External id": 20855,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3446 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651401670.954, "dur": 25.089, "args": { "External id": 20856,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3447 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651401712.060, "dur": 16.880, "args": { "External id": 20857,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3448 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651401746.959, "dur": 13.984, "args": { "External id": 20858,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3449 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651401774.085, "dur": 17.558, "args": { "External id": 20859,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401864.840, "dur": 15.060, "args": { "External id": 20860,"Record function id": 0, "Ev Idx": 3451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401867.925, "dur": 10.870, "args": { "External id": 20861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401872.074, "dur": 5.777, "args": { "External id": 20862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401873.414, "dur": 4.357, "args": { "External id": 20863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401883.875, "dur": 4.689, "args": { "External id": 20864,"Record function id": 0, "Ev Idx": 3455 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401885.238, "dur": 2.879, "args": { "External id": 20865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401885.949, "dur": 1.710, "args": { "External id": 20866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3457 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401886.582, "dur": 0.975, "args": { "External id": 20867,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401891.825, "dur": 4.270, "args": { "External id": 20868,"Record function id": 0, "Ev Idx": 3459 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401892.891, "dur": 2.759, "args": { "External id": 20869,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401893.640, "dur": 1.597, "args": { "External id": 20870,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3461 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401894.268, "dur": 0.882, "args": { "External id": 20871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3462 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401899.319, "dur": 3.990, "args": { "External id": 20872,"Record function id": 0, "Ev Idx": 3463 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401900.503, "dur": 2.400, "args": { "External id": 20873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401901.082, "dur": 1.401, "args": { "External id": 20874,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3465 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401901.817, "dur": 0.600, "args": { "External id": 20875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3466 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401909.408, "dur": 4.274, "args": { "External id": 20876,"Record function id": 0, "Ev Idx": 3467 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401910.699, "dur": 2.561, "args": { "External id": 20877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401911.254, "dur": 1.576, "args": { "External id": 20878,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3469 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401912.107, "dur": 0.656, "args": { "External id": 20879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401916.673, "dur": 4.013, "args": { "External id": 20880,"Record function id": 0, "Ev Idx": 3471 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401917.960, "dur": 2.329, "args": { "External id": 20881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401918.583, "dur": 1.286, "args": { "External id": 20882,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3473 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401919.224, "dur": 0.569, "args": { "External id": 20883,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401923.730, "dur": 3.632, "args": { "External id": 20884,"Record function id": 0, "Ev Idx": 3475 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401924.862, "dur": 2.100, "args": { "External id": 20885,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401925.332, "dur": 1.198, "args": { "External id": 20886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3477 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401925.726, "dur": 0.738, "args": { "External id": 20887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401930.382, "dur": 3.846, "args": { "External id": 20888,"Record function id": 0, "Ev Idx": 3479 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401931.359, "dur": 2.469, "args": { "External id": 20889,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401931.891, "dur": 1.533, "args": { "External id": 20890,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3481 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401932.273, "dur": 1.084, "args": { "External id": 20891,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401937.499, "dur": 5.819, "args": { "External id": 20892,"Record function id": 0, "Ev Idx": 3483 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651401938.617, "dur": 4.298, "args": { "External id": 20893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401939.206, "dur": 3.300, "args": { "External id": 20894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3485 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651401941.661, "dur": 0.773, "args": { "External id": 20895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651401946.764, "dur": 36520.349, "args": { "External id": 20896,"Record function id": 0, "Sequence number": 246571, "Fwd thread id": 1, "Ev Idx": 3487 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651401947.852, "dur": 36510.883, "args": { "External id": 20897,"Sequence number": 246571, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3488 } }, { "ph": "f", "id": 197, "pid": 1336759, "tid": 1381173, "ts": 1295651401947.852, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651401978.097, "dur": 82.518, "args": { "External id": 20898,"Record function id": 0, "Ev Idx": 3489 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651402070.138, "dur": 64.132, "args": { "External id": 20899,"Record function id": 0, "Ev Idx": 3490 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.15)", "pid": 1336759, "tid": 1381173, "ts": 1295651402140.156, "dur": 36309.749, "args": { "External id": 20900,"Record function id": 0, "Ev Idx": 3491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651402248.762, "dur": 8.377, "args": { "External id": 20901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651402268.244, "dur": 5.589, "args": { "External id": 20902,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3493 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651402289.056, "dur": 35240.670, "args": { "External id": 20903,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651402302.642, "dur": 35218.102, "args": { "External id": 20904,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651402352.479, "dur": 14.117, "args": { "External id": 20905,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651402372.970, "dur": 35111.447, "args": { "External id": 20906,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651402375.437, "dur": 35108.484, "args": { "External id": 20907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651402379.329, "dur": 5.271, "args": { "External id": 20908,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651402386.232, "dur": 35094.155, "args": { "External id": 20909,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651437620.131, "dur": 8.890, "args": { "External id": 20910,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651437622.718, "dur": 5.853, "args": { "External id": 20911,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651437655.698, "dur": 476.594, "args": { "External id": 20912,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651437686.625, "dur": 439.954, "args": { "External id": 20913,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3504, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651437697.376, "dur": 422.992, "args": { "External id": 20914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651438159.186, "dur": 2.257, "args": { "External id": 20915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3506, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438226.142, "dur": 21.934, "args": { "External id": 20916,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438297.619, "dur": 2.128, "args": { "External id": 20917,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438314.878, "dur": 1.571, "args": { "External id": 20918,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438328.124, "dur": 1.458, "args": { "External id": 20919,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438339.668, "dur": 1.182, "args": { "External id": 20920,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438349.823, "dur": 0.918, "args": { "External id": 20921,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438362.104, "dur": 1.158, "args": { "External id": 20922,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438373.151, "dur": 1.628, "args": { "External id": 20923,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438385.524, "dur": 1.909, "args": { "External id": 20924,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651438483.768, "dur": 2677.603, "args": { "External id": 20925,"Record function id": 0, "Ev Idx": 3516 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651438502.414, "dur": 1001.081, "args": { "External id": 20926,"Record function id": 0, "Ev Idx": 3517 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651438517.211, "dur": 304.374, "args": { "External id": 20927,"Record function id": 0, "Ev Idx": 3518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438591.299, "dur": 5.450, "args": { "External id": 20928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438599.930, "dur": 1.461, "args": { "External id": 20929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438603.123, "dur": 1.383, "args": { "External id": 20930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438606.349, "dur": 1.140, "args": { "External id": 20931,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438610.424, "dur": 1.571, "args": { "External id": 20932,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438613.524, "dur": 1.485, "args": { "External id": 20933,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438616.427, "dur": 1.617, "args": { "External id": 20934,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438619.821, "dur": 1.217, "args": { "External id": 20935,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438624.182, "dur": 1.509, "args": { "External id": 20936,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651438627.226, "dur": 1.521, "args": { "External id": 20937,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3528 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651438646.673, "dur": 147.322, "args": { "External id": 20938,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651438661.445, "dur": 127.922, "args": { "External id": 20939,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651438680.889, "dur": 13.830, "args": { "External id": 20940,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651438697.959, "dur": 65.347, "args": { "External id": 20941,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651438700.672, "dur": 62.273, "args": { "External id": 20942,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651438704.456, "dur": 5.367, "args": { "External id": 20943,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651438713.655, "dur": 48.618, "args": { "External id": 20944,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3535 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.13", "pid": 1336759, "tid": 1381173, "ts": 1295651438896.445, "dur": 599.280, "args": { "External id": 20945,"Record function id": 0, "Ev Idx": 3536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651438913.365, "dur": 568.425, "args": { "External id": 20946,"Record function id": 0, "Ev Idx": 3537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651438965.332, "dur": 5.381, "args": { "External id": 20947,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651439025.919, "dur": 24.144, "args": { "External id": 20948,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439030.447, "dur": 2.459, "args": { "External id": 20949,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439034.367, "dur": 0.548, "args": { "External id": 20950,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439035.920, "dur": 0.388, "args": { "External id": 20951,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439037.109, "dur": 0.372, "args": { "External id": 20952,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439038.491, "dur": 0.359, "args": { "External id": 20953,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439040.038, "dur": 0.206, "args": { "External id": 20954,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439041.234, "dur": 0.741, "args": { "External id": 20955,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439043.174, "dur": 0.673, "args": { "External id": 20956,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439044.844, "dur": 0.767, "args": { "External id": 20957,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651439059.602, "dur": 32.573, "args": { "External id": 20958,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3549 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651439124.035, "dur": 102.263, "args": { "External id": 20959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651439134.109, "dur": 4.497, "args": { "External id": 20960,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651439146.472, "dur": 10.502, "args": { "External id": 20961,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651439150.582, "dur": 5.936, "args": { "External id": 20962,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439153.743, "dur": 0.898, "args": { "External id": 20963,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651439165.985, "dur": 24.637, "args": { "External id": 20964,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439167.583, "dur": 0.440, "args": { "External id": 20965,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439169.136, "dur": 0.771, "args": { "External id": 20966,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439170.947, "dur": 0.589, "args": { "External id": 20967,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439173.110, "dur": 0.603, "args": { "External id": 20968,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439175.214, "dur": 0.783, "args": { "External id": 20969,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439177.301, "dur": 0.415, "args": { "External id": 20970,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439178.871, "dur": 0.747, "args": { "External id": 20971,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439180.458, "dur": 0.832, "args": { "External id": 20972,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651439182.483, "dur": 0.584, "args": { "External id": 20973,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651439201.432, "dur": 17.744, "args": { "External id": 20974,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3565 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651439290.411, "dur": 119.948, "args": { "External id": 20975,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3566 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651439319.609, "dur": 87.143, "args": { "External id": 20976,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3567, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651439329.135, "dur": 73.483, "args": { "External id": 20977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3568 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651439427.754, "dur": 1.780, "args": { "External id": 20978,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3569, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651439510.095, "dur": 1628.601, "args": { "External id": 20979,"Sequence number": 246570, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3570 } }, { "ph": "f", "id": 198, "pid": 1336759, "tid": 1381173, "ts": 1295651439510.095, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651439615.628, "dur": 102.285, "args": { "External id": 20980,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3571 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651439758.522, "dur": 36.503, "args": { "External id": 20981,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651439810.066, "dur": 50.349, "args": { "External id": 20982,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651439869.213, "dur": 32.832, "args": { "External id": 20983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651439907.838, "dur": 43.498, "args": { "External id": 20984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651439958.199, "dur": 67.427, "args": { "External id": 20985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440037.438, "dur": 45.825, "args": { "External id": 20986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3577 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651440110.057, "dur": 22.492, "args": { "External id": 20987,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3578 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651440151.761, "dur": 26.823, "args": { "External id": 20988,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3579 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651440199.792, "dur": 18.779, "args": { "External id": 20989,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3580 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651440249.246, "dur": 18.314, "args": { "External id": 20990,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440278.584, "dur": 31.582, "args": { "External id": 20991,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440313.849, "dur": 32.390, "args": { "External id": 20992,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3583 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651440397.237, "dur": 166.765, "args": { "External id": 20993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651440475.645, "dur": 6.110, "args": { "External id": 20994,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651440483.603, "dur": 2.441, "args": { "External id": 20995,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3586 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651440595.575, "dur": 24.100, "args": { "External id": 20996,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3587 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651440631.093, "dur": 13.982, "args": { "External id": 20997,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440656.567, "dur": 34.582, "args": { "External id": 20998,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440698.711, "dur": 34.306, "args": { "External id": 20999,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440739.855, "dur": 20.472, "args": { "External id": 21000,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440765.126, "dur": 33.748, "args": { "External id": 21001,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440805.066, "dur": 19.301, "args": { "External id": 21002,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651440830.770, "dur": 29.385, "args": { "External id": 21003,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3594 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651440878.057, "dur": 21.976, "args": { "External id": 21004,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3595 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651440930.647, "dur": 31.102, "args": { "External id": 21005,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3596 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651441020.118, "dur": 24.360, "args": { "External id": 21006,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3597 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651441065.077, "dur": 13.806, "args": { "External id": 21007,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3598 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651441094.813, "dur": 15.937, "args": { "External id": 21008,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3599 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441184.896, "dur": 15.639, "args": { "External id": 21009,"Record function id": 0, "Ev Idx": 3600 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441188.122, "dur": 11.357, "args": { "External id": 21010,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441192.427, "dur": 6.125, "args": { "External id": 21011,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3602 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441193.595, "dur": 4.797, "args": { "External id": 21012,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3603 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441207.307, "dur": 4.315, "args": { "External id": 21013,"Record function id": 0, "Ev Idx": 3604 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441208.483, "dur": 2.721, "args": { "External id": 21014,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441209.183, "dur": 1.569, "args": { "External id": 21015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3606 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441209.675, "dur": 1.005, "args": { "External id": 21016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3607 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441214.848, "dur": 4.864, "args": { "External id": 21017,"Record function id": 0, "Ev Idx": 3608 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441216.161, "dur": 3.123, "args": { "External id": 21018,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441216.839, "dur": 2.008, "args": { "External id": 21019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3610 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441217.456, "dur": 1.271, "args": { "External id": 21020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3611 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441222.829, "dur": 3.924, "args": { "External id": 21021,"Record function id": 0, "Ev Idx": 3612 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441224.127, "dur": 2.234, "args": { "External id": 21022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441224.663, "dur": 1.229, "args": { "External id": 21023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3614 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441225.087, "dur": 0.691, "args": { "External id": 21024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3615 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441247.436, "dur": 6.126, "args": { "External id": 21025,"Record function id": 0, "Ev Idx": 3616 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441248.972, "dur": 3.913, "args": { "External id": 21026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441250.059, "dur": 1.986, "args": { "External id": 21027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3618 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441250.473, "dur": 1.369, "args": { "External id": 21028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3619 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441256.941, "dur": 6.918, "args": { "External id": 21029,"Record function id": 0, "Ev Idx": 3620 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441257.959, "dur": 5.488, "args": { "External id": 21030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441258.508, "dur": 4.506, "args": { "External id": 21031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3622 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441258.976, "dur": 3.971, "args": { "External id": 21032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3623 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441267.145, "dur": 4.233, "args": { "External id": 21033,"Record function id": 0, "Ev Idx": 3624 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441268.256, "dur": 2.686, "args": { "External id": 21034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441268.934, "dur": 1.594, "args": { "External id": 21035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3626 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441269.417, "dur": 1.047, "args": { "External id": 21036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3627 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441274.527, "dur": 3.833, "args": { "External id": 21037,"Record function id": 0, "Ev Idx": 3628 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441275.611, "dur": 2.323, "args": { "External id": 21038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441276.260, "dur": 1.265, "args": { "External id": 21039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3630 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441276.507, "dur": 0.954, "args": { "External id": 21040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3631 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441281.556, "dur": 5.285, "args": { "External id": 21041,"Record function id": 0, "Ev Idx": 3632 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651441282.520, "dur": 3.914, "args": { "External id": 21042,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441283.011, "dur": 2.978, "args": { "External id": 21043,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3634 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651441285.168, "dur": 0.714, "args": { "External id": 21044,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3635 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651441290.393, "dur": 36386.723, "args": { "External id": 21045,"Record function id": 0, "Sequence number": 246569, "Fwd thread id": 1, "Ev Idx": 3636 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651441291.762, "dur": 36376.732, "args": { "External id": 21046,"Sequence number": 246569, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3637 } }, { "ph": "f", "id": 199, "pid": 1336759, "tid": 1381173, "ts": 1295651441291.762, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651441324.688, "dur": 35.697, "args": { "External id": 21047,"Record function id": 0, "Ev Idx": 3638 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651441368.122, "dur": 63.781, "args": { "External id": 21048,"Record function id": 0, "Ev Idx": 3639 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.14)", "pid": 1336759, "tid": 1381173, "ts": 1295651441437.713, "dur": 36222.814, "args": { "External id": 21049,"Record function id": 0, "Ev Idx": 3640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651441523.785, "dur": 7.039, "args": { "External id": 21050,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651441540.483, "dur": 5.078, "args": { "External id": 21051,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3642 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651441560.462, "dur": 35299.119, "args": { "External id": 21052,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651441573.173, "dur": 35277.846, "args": { "External id": 21053,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651441615.208, "dur": 14.090, "args": { "External id": 21054,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651441635.759, "dur": 35175.384, "args": { "External id": 21055,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651441638.457, "dur": 35172.152, "args": { "External id": 21056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651441641.822, "dur": 5.460, "args": { "External id": 21057,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651441651.169, "dur": 35155.743, "args": { "External id": 21058,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651476946.074, "dur": 9.300, "args": { "External id": 21059,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651476949.130, "dur": 5.854, "args": { "External id": 21060,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3651 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651477005.699, "dur": 369.559, "args": { "External id": 21061,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3652 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651477037.285, "dur": 333.012, "args": { "External id": 21062,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3653, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651477049.842, "dur": 314.604, "args": { "External id": 21063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3654 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651477398.453, "dur": 2.348, "args": { "External id": 21064,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3655, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477461.288, "dur": 6.772, "args": { "External id": 21065,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477515.671, "dur": 1.564, "args": { "External id": 21066,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477531.375, "dur": 1.393, "args": { "External id": 21067,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477544.310, "dur": 1.226, "args": { "External id": 21068,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477554.906, "dur": 0.771, "args": { "External id": 21069,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477564.137, "dur": 1.369, "args": { "External id": 21070,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477574.806, "dur": 1.427, "args": { "External id": 21071,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477585.757, "dur": 1.247, "args": { "External id": 21072,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477597.672, "dur": 1.885, "args": { "External id": 21073,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651477691.392, "dur": 2651.327, "args": { "External id": 21074,"Record function id": 0, "Ev Idx": 3665 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651477710.008, "dur": 987.102, "args": { "External id": 21075,"Record function id": 0, "Ev Idx": 3666 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651477726.563, "dur": 345.459, "args": { "External id": 21076,"Record function id": 0, "Ev Idx": 3667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477798.599, "dur": 4.426, "args": { "External id": 21077,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477806.180, "dur": 1.123, "args": { "External id": 21078,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477809.021, "dur": 1.195, "args": { "External id": 21079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477811.871, "dur": 1.487, "args": { "External id": 21080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477814.654, "dur": 1.351, "args": { "External id": 21081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477819.123, "dur": 6.509, "args": { "External id": 21082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477827.072, "dur": 1.053, "args": { "External id": 21083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477829.589, "dur": 1.456, "args": { "External id": 21084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477832.243, "dur": 1.102, "args": { "External id": 21085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651477836.398, "dur": 1.207, "args": { "External id": 21086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3677 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651477855.430, "dur": 183.229, "args": { "External id": 21087,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651477870.204, "dur": 162.950, "args": { "External id": 21088,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651477885.696, "dur": 13.114, "args": { "External id": 21089,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651477901.887, "dur": 62.971, "args": { "External id": 21090,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651477903.983, "dur": 60.515, "args": { "External id": 21091,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651477907.833, "dur": 5.691, "args": { "External id": 21092,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651477915.232, "dur": 48.585, "args": { "External id": 21093,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3684 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.12", "pid": 1336759, "tid": 1381173, "ts": 1295651478152.769, "dur": 536.109, "args": { "External id": 21094,"Record function id": 0, "Ev Idx": 3685 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651478170.670, "dur": 506.336, "args": { "External id": 21095,"Record function id": 0, "Ev Idx": 3686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651478224.732, "dur": 22.020, "args": { "External id": 21096,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651478264.899, "dur": 25.481, "args": { "External id": 21097,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478269.767, "dur": 1.820, "args": { "External id": 21098,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478273.443, "dur": 0.253, "args": { "External id": 21099,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478274.913, "dur": 0.186, "args": { "External id": 21100,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478276.547, "dur": 0.842, "args": { "External id": 21101,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478279.032, "dur": 0.798, "args": { "External id": 21102,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478280.883, "dur": 0.660, "args": { "External id": 21103,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478282.843, "dur": 0.475, "args": { "External id": 21104,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478284.406, "dur": 0.825, "args": { "External id": 21105,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478286.238, "dur": 0.510, "args": { "External id": 21106,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651478299.449, "dur": 32.076, "args": { "External id": 21107,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3698 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651478362.729, "dur": 91.465, "args": { "External id": 21108,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651478372.754, "dur": 4.428, "args": { "External id": 21109,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651478381.591, "dur": 10.346, "args": { "External id": 21110,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651478386.433, "dur": 5.079, "args": { "External id": 21111,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478389.438, "dur": 0.663, "args": { "External id": 21112,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651478398.118, "dur": 24.215, "args": { "External id": 21113,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478399.968, "dur": 0.712, "args": { "External id": 21114,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478401.925, "dur": 0.738, "args": { "External id": 21115,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478403.751, "dur": 0.402, "args": { "External id": 21116,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478405.159, "dur": 0.590, "args": { "External id": 21117,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478407.189, "dur": 0.907, "args": { "External id": 21118,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478409.121, "dur": 0.981, "args": { "External id": 21119,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478410.910, "dur": 0.646, "args": { "External id": 21120,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478412.649, "dur": 0.600, "args": { "External id": 21121,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651478414.591, "dur": 0.704, "args": { "External id": 21122,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651478430.095, "dur": 16.790, "args": { "External id": 21123,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651478497.232, "dur": 112.736, "args": { "External id": 21124,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651478523.982, "dur": 82.482, "args": { "External id": 21125,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3716, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651478532.625, "dur": 69.718, "args": { "External id": 21126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651478626.663, "dur": 1.784, "args": { "External id": 21127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3718, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651478704.649, "dur": 1618.253, "args": { "External id": 21128,"Sequence number": 246568, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3719 } }, { "ph": "f", "id": 200, "pid": 1336759, "tid": 1381173, "ts": 1295651478704.649, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651478808.629, "dur": 101.236, "args": { "External id": 21129,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651478947.478, "dur": 75.453, "args": { "External id": 21130,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651479042.609, "dur": 60.980, "args": { "External id": 21131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479114.309, "dur": 32.768, "args": { "External id": 21132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479156.333, "dur": 44.802, "args": { "External id": 21133,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479207.579, "dur": 41.951, "args": { "External id": 21134,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479260.131, "dur": 44.603, "args": { "External id": 21135,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3726 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651479334.837, "dur": 22.382, "args": { "External id": 21136,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3727 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651479375.480, "dur": 26.985, "args": { "External id": 21137,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3728 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651479424.155, "dur": 19.222, "args": { "External id": 21138,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3729 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651479455.344, "dur": 15.492, "args": { "External id": 21139,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479479.570, "dur": 27.849, "args": { "External id": 21140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479510.704, "dur": 31.912, "args": { "External id": 21141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3732 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651479568.729, "dur": 163.350, "args": { "External id": 21142,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651479646.118, "dur": 5.781, "args": { "External id": 21143,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651479654.020, "dur": 2.034, "args": { "External id": 21144,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3735 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651479761.294, "dur": 24.538, "args": { "External id": 21145,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3736 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651479802.019, "dur": 13.334, "args": { "External id": 21146,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479823.569, "dur": 31.705, "args": { "External id": 21147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479860.837, "dur": 32.977, "args": { "External id": 21148,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479900.368, "dur": 20.159, "args": { "External id": 21149,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479924.962, "dur": 28.902, "args": { "External id": 21150,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651479959.653, "dur": 19.221, "args": { "External id": 21151,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651480025.923, "dur": 35.074, "args": { "External id": 21152,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3743 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651480083.452, "dur": 22.040, "args": { "External id": 21153,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3744 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651480126.937, "dur": 21.464, "args": { "External id": 21154,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3745 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651480178.069, "dur": 27.402, "args": { "External id": 21155,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3746 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651480227.190, "dur": 31.671, "args": { "External id": 21156,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3747 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651480274.101, "dur": 18.380, "args": { "External id": 21157,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480369.355, "dur": 15.219, "args": { "External id": 21158,"Record function id": 0, "Ev Idx": 3749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480372.423, "dur": 11.074, "args": { "External id": 21159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480376.529, "dur": 5.899, "args": { "External id": 21160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480377.753, "dur": 4.576, "args": { "External id": 21161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480388.464, "dur": 4.190, "args": { "External id": 21162,"Record function id": 0, "Ev Idx": 3753 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480389.580, "dur": 2.648, "args": { "External id": 21163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480390.373, "dur": 1.327, "args": { "External id": 21164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3755 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480390.770, "dur": 0.826, "args": { "External id": 21165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480395.845, "dur": 4.102, "args": { "External id": 21166,"Record function id": 0, "Ev Idx": 3757 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480397.162, "dur": 2.313, "args": { "External id": 21167,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480397.623, "dur": 1.395, "args": { "External id": 21168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3759 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480398.143, "dur": 0.797, "args": { "External id": 21169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3760 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480403.060, "dur": 7.023, "args": { "External id": 21170,"Record function id": 0, "Ev Idx": 3761 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480407.532, "dur": 2.142, "args": { "External id": 21171,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480408.028, "dur": 1.222, "args": { "External id": 21172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3763 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480408.559, "dur": 0.621, "args": { "External id": 21173,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3764 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480413.154, "dur": 3.475, "args": { "External id": 21174,"Record function id": 0, "Ev Idx": 3765 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480414.156, "dur": 2.018, "args": { "External id": 21175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480414.630, "dur": 1.103, "args": { "External id": 21176,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3767 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480414.891, "dur": 0.778, "args": { "External id": 21177,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3768 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480419.709, "dur": 3.417, "args": { "External id": 21178,"Record function id": 0, "Ev Idx": 3769 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480420.684, "dur": 2.018, "args": { "External id": 21179,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480421.146, "dur": 1.090, "args": { "External id": 21180,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3771 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480421.497, "dur": 0.679, "args": { "External id": 21181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3772 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480426.259, "dur": 5.735, "args": { "External id": 21182,"Record function id": 0, "Ev Idx": 3773 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480427.372, "dur": 4.235, "args": { "External id": 21183,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480427.794, "dur": 3.395, "args": { "External id": 21184,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3775 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480430.365, "dur": 0.752, "args": { "External id": 21185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3776 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480435.129, "dur": 3.933, "args": { "External id": 21186,"Record function id": 0, "Ev Idx": 3777 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480436.267, "dur": 2.400, "args": { "External id": 21187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480436.941, "dur": 1.310, "args": { "External id": 21188,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3779 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480437.511, "dur": 0.663, "args": { "External id": 21189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3780 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480442.132, "dur": 3.786, "args": { "External id": 21190,"Record function id": 0, "Ev Idx": 3781 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651480443.287, "dur": 2.217, "args": { "External id": 21191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480443.754, "dur": 1.289, "args": { "External id": 21192,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3783 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651480444.027, "dur": 0.948, "args": { "External id": 21193,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3784 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651480449.477, "dur": 38231.712, "args": { "External id": 21194,"Record function id": 0, "Sequence number": 246567, "Fwd thread id": 1, "Ev Idx": 3785 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651480450.658, "dur": 38222.797, "args": { "External id": 21195,"Sequence number": 246567, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3786 } }, { "ph": "f", "id": 201, "pid": 1336759, "tid": 1381173, "ts": 1295651480450.658, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651480482.499, "dur": 42.063, "args": { "External id": 21196,"Record function id": 0, "Ev Idx": 3787 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651480532.319, "dur": 64.471, "args": { "External id": 21197,"Record function id": 0, "Ev Idx": 3788 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.13)", "pid": 1336759, "tid": 1381173, "ts": 1295651480602.964, "dur": 38062.971, "args": { "External id": 21198,"Record function id": 0, "Ev Idx": 3789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651480689.116, "dur": 6.787, "args": { "External id": 21199,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651480705.547, "dur": 4.754, "args": { "External id": 21200,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3791 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651480724.838, "dur": 37046.227, "args": { "External id": 21201,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651480737.329, "dur": 37024.636, "args": { "External id": 21202,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651480780.507, "dur": 13.862, "args": { "External id": 21203,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651480800.551, "dur": 36925.352, "args": { "External id": 21204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651480803.239, "dur": 36922.074, "args": { "External id": 21205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651480807.523, "dur": 8.490, "args": { "External id": 21206,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651480817.656, "dur": 36903.853, "args": { "External id": 21207,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651517864.860, "dur": 8.895, "args": { "External id": 21208,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651517867.699, "dur": 5.714, "args": { "External id": 21209,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3800 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651517902.623, "dur": 467.653, "args": { "External id": 21210,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3801 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651517933.845, "dur": 430.850, "args": { "External id": 21211,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3802, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651517944.859, "dur": 413.784, "args": { "External id": 21212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3803 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651518393.897, "dur": 2.716, "args": { "External id": 21213,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3804, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518462.120, "dur": 7.140, "args": { "External id": 21214,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518514.121, "dur": 1.785, "args": { "External id": 21215,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518531.445, "dur": 1.199, "args": { "External id": 21216,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518544.601, "dur": 1.279, "args": { "External id": 21217,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518555.324, "dur": 1.446, "args": { "External id": 21218,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518565.836, "dur": 1.417, "args": { "External id": 21219,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518576.588, "dur": 1.209, "args": { "External id": 21220,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518590.262, "dur": 1.680, "args": { "External id": 21221,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518602.693, "dur": 1.321, "args": { "External id": 21222,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3813 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651518695.823, "dur": 2658.813, "args": { "External id": 21223,"Record function id": 0, "Ev Idx": 3814 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651518714.858, "dur": 1003.970, "args": { "External id": 21224,"Record function id": 0, "Ev Idx": 3815 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651518730.667, "dur": 352.207, "args": { "External id": 21225,"Record function id": 0, "Ev Idx": 3816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518807.636, "dur": 4.453, "args": { "External id": 21226,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518815.064, "dur": 1.266, "args": { "External id": 21227,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518817.943, "dur": 1.200, "args": { "External id": 21228,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518820.800, "dur": 1.630, "args": { "External id": 21229,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518823.788, "dur": 1.174, "args": { "External id": 21230,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518828.450, "dur": 1.230, "args": { "External id": 21231,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518831.548, "dur": 1.327, "args": { "External id": 21232,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518834.331, "dur": 1.437, "args": { "External id": 21233,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518837.354, "dur": 1.461, "args": { "External id": 21234,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651518842.126, "dur": 1.162, "args": { "External id": 21235,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3826 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651518860.811, "dur": 189.460, "args": { "External id": 21236,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651518876.485, "dur": 167.821, "args": { "External id": 21237,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651518893.865, "dur": 13.633, "args": { "External id": 21238,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651518910.690, "dur": 64.141, "args": { "External id": 21239,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651518913.112, "dur": 61.418, "args": { "External id": 21240,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651518916.765, "dur": 5.518, "args": { "External id": 21241,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651518923.812, "dur": 50.075, "args": { "External id": 21242,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3833 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.11", "pid": 1336759, "tid": 1381173, "ts": 1295651519166.811, "dur": 544.317, "args": { "External id": 21243,"Record function id": 0, "Ev Idx": 3834 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651519184.413, "dur": 514.493, "args": { "External id": 21244,"Record function id": 0, "Ev Idx": 3835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651519258.732, "dur": 7.347, "args": { "External id": 21245,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651519282.243, "dur": 27.028, "args": { "External id": 21246,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519287.265, "dur": 1.881, "args": { "External id": 21247,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519291.623, "dur": 0.310, "args": { "External id": 21248,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519293.523, "dur": 0.203, "args": { "External id": 21249,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519294.928, "dur": 0.447, "args": { "External id": 21250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519296.914, "dur": 0.485, "args": { "External id": 21251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519298.991, "dur": 0.677, "args": { "External id": 21252,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519300.889, "dur": 0.981, "args": { "External id": 21253,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519303.129, "dur": 0.877, "args": { "External id": 21254,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519305.165, "dur": 0.536, "args": { "External id": 21255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651519318.660, "dur": 31.000, "args": { "External id": 21256,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651519380.666, "dur": 92.290, "args": { "External id": 21257,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651519390.113, "dur": 3.565, "args": { "External id": 21258,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651519398.271, "dur": 10.534, "args": { "External id": 21259,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651519402.886, "dur": 5.521, "args": { "External id": 21260,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519406.026, "dur": 0.868, "args": { "External id": 21261,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651519415.388, "dur": 24.491, "args": { "External id": 21262,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519417.269, "dur": 0.618, "args": { "External id": 21263,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519419.101, "dur": 0.810, "args": { "External id": 21264,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519421.285, "dur": 0.624, "args": { "External id": 21265,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519422.800, "dur": 0.815, "args": { "External id": 21266,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519424.971, "dur": 0.567, "args": { "External id": 21267,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519427.018, "dur": 0.675, "args": { "External id": 21268,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519429.020, "dur": 0.889, "args": { "External id": 21269,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519431.135, "dur": 0.678, "args": { "External id": 21270,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651519432.787, "dur": 0.648, "args": { "External id": 21271,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651519448.556, "dur": 16.962, "args": { "External id": 21272,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651519517.163, "dur": 113.823, "args": { "External id": 21273,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651519543.544, "dur": 83.947, "args": { "External id": 21274,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3865, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651519553.354, "dur": 70.183, "args": { "External id": 21275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651519648.687, "dur": 1.931, "args": { "External id": 21276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3867, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651519725.055, "dur": 1606.465, "args": { "External id": 21277,"Sequence number": 246566, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3868 } }, { "ph": "f", "id": 202, "pid": 1336759, "tid": 1381173, "ts": 1295651519725.055, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651519829.451, "dur": 104.675, "args": { "External id": 21278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3869 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651519971.003, "dur": 80.688, "args": { "External id": 21279,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651520071.651, "dur": 55.258, "args": { "External id": 21280,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520136.984, "dur": 32.739, "args": { "External id": 21281,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520176.503, "dur": 44.741, "args": { "External id": 21282,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520243.721, "dur": 32.845, "args": { "External id": 21283,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520286.338, "dur": 41.598, "args": { "External id": 21284,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3875 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651520354.795, "dur": 22.129, "args": { "External id": 21285,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3876 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651520397.924, "dur": 26.706, "args": { "External id": 21286,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3877 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651520445.026, "dur": 17.826, "args": { "External id": 21287,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651520477.655, "dur": 13.102, "args": { "External id": 21288,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520499.564, "dur": 26.710, "args": { "External id": 21289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520529.552, "dur": 31.479, "args": { "External id": 21290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3881 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651520587.648, "dur": 163.878, "args": { "External id": 21291,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651520665.058, "dur": 5.620, "args": { "External id": 21292,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651520672.663, "dur": 2.691, "args": { "External id": 21293,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3884 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651520779.292, "dur": 22.218, "args": { "External id": 21294,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3885 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651520812.376, "dur": 14.098, "args": { "External id": 21295,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520834.860, "dur": 31.826, "args": { "External id": 21296,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520872.773, "dur": 32.156, "args": { "External id": 21297,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520911.662, "dur": 19.995, "args": { "External id": 21298,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520936.901, "dur": 28.847, "args": { "External id": 21299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651520971.827, "dur": 58.718, "args": { "External id": 21300,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651521041.334, "dur": 33.140, "args": { "External id": 21301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3892 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651521093.818, "dur": 21.656, "args": { "External id": 21302,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3893 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651521135.547, "dur": 36.554, "args": { "External id": 21303,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3894 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651521195.530, "dur": 19.213, "args": { "External id": 21304,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3895 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651521251.408, "dur": 17.222, "args": { "External id": 21305,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3896 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651521287.400, "dur": 16.166, "args": { "External id": 21306,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3897 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521376.392, "dur": 15.501, "args": { "External id": 21307,"Record function id": 0, "Ev Idx": 3898 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521379.829, "dur": 10.961, "args": { "External id": 21308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521384.174, "dur": 5.738, "args": { "External id": 21309,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3900 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521385.540, "dur": 4.246, "args": { "External id": 21310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3901 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521396.018, "dur": 4.107, "args": { "External id": 21311,"Record function id": 0, "Ev Idx": 3902 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521397.112, "dur": 2.602, "args": { "External id": 21312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521397.860, "dur": 1.316, "args": { "External id": 21313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3904 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521398.464, "dur": 0.601, "args": { "External id": 21314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3905 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521403.556, "dur": 4.399, "args": { "External id": 21315,"Record function id": 0, "Ev Idx": 3906 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521404.656, "dur": 2.886, "args": { "External id": 21316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521405.414, "dur": 1.712, "args": { "External id": 21317,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3908 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521405.969, "dur": 1.054, "args": { "External id": 21318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521411.069, "dur": 3.820, "args": { "External id": 21319,"Record function id": 0, "Ev Idx": 3910 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521412.310, "dur": 2.192, "args": { "External id": 21320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521412.887, "dur": 1.185, "args": { "External id": 21321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3912 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521413.311, "dur": 0.670, "args": { "External id": 21322,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3913 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521417.902, "dur": 3.948, "args": { "External id": 21323,"Record function id": 0, "Ev Idx": 3914 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521418.942, "dur": 2.483, "args": { "External id": 21324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521419.414, "dur": 1.534, "args": { "External id": 21325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3916 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521419.893, "dur": 0.985, "args": { "External id": 21326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3917 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521424.895, "dur": 4.881, "args": { "External id": 21327,"Record function id": 0, "Ev Idx": 3918 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521426.032, "dur": 3.337, "args": { "External id": 21328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521426.761, "dur": 2.172, "args": { "External id": 21329,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3920 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521427.115, "dur": 1.753, "args": { "External id": 21330,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3921 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521432.858, "dur": 3.866, "args": { "External id": 21331,"Record function id": 0, "Ev Idx": 3922 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521434.074, "dur": 2.259, "args": { "External id": 21332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521434.556, "dur": 1.357, "args": { "External id": 21333,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3924 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521435.017, "dur": 0.827, "args": { "External id": 21334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3925 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521439.739, "dur": 5.186, "args": { "External id": 21335,"Record function id": 0, "Ev Idx": 3926 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521440.614, "dur": 3.898, "args": { "External id": 21336,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521441.213, "dur": 2.859, "args": { "External id": 21337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3928 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521443.349, "dur": 0.620, "args": { "External id": 21338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3929 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521448.014, "dur": 7.449, "args": { "External id": 21339,"Record function id": 0, "Ev Idx": 3930 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651521449.150, "dur": 5.895, "args": { "External id": 21340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521449.627, "dur": 4.986, "args": { "External id": 21341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3932 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651521453.643, "dur": 0.906, "args": { "External id": 21342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3933 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651521462.463, "dur": 35783.234, "args": { "External id": 21343,"Record function id": 0, "Sequence number": 246565, "Fwd thread id": 1, "Ev Idx": 3934 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651521463.599, "dur": 35758.038, "args": { "External id": 21344,"Sequence number": 246565, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3935 } }, { "ph": "f", "id": 203, "pid": 1336759, "tid": 1381173, "ts": 1295651521463.599, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651521491.364, "dur": 40.094, "args": { "External id": 21345,"Record function id": 0, "Ev Idx": 3936 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651521538.582, "dur": 63.261, "args": { "External id": 21346,"Record function id": 0, "Ev Idx": 3937 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.12)", "pid": 1336759, "tid": 1381173, "ts": 1295651521607.462, "dur": 35606.346, "args": { "External id": 21347,"Record function id": 0, "Ev Idx": 3938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651521698.289, "dur": 7.077, "args": { "External id": 21348,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651521714.498, "dur": 4.829, "args": { "External id": 21349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3940 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651521734.626, "dur": 34685.593, "args": { "External id": 21350,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651521747.169, "dur": 34664.285, "args": { "External id": 21351,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651521790.238, "dur": 13.547, "args": { "External id": 21352,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651521813.058, "dur": 34562.821, "args": { "External id": 21353,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651521815.769, "dur": 34559.237, "args": { "External id": 21354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651521819.529, "dur": 5.664, "args": { "External id": 21355,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651521826.811, "dur": 34544.667, "args": { "External id": 21356,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651556508.565, "dur": 8.870, "args": { "External id": 21357,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651556511.313, "dur": 5.775, "args": { "External id": 21358,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3949 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651556549.891, "dur": 334.561, "args": { "External id": 21359,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3950 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651556578.112, "dur": 301.852, "args": { "External id": 21360,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3951, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651556589.141, "dur": 285.675, "args": { "External id": 21361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3952 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651556902.999, "dur": 2.291, "args": { "External id": 21362,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3953, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651556958.982, "dur": 6.591, "args": { "External id": 21363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557066.581, "dur": 2.499, "args": { "External id": 21364,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557084.712, "dur": 1.275, "args": { "External id": 21365,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557096.425, "dur": 0.814, "args": { "External id": 21366,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557109.329, "dur": 0.829, "args": { "External id": 21367,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557118.677, "dur": 1.061, "args": { "External id": 21368,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557128.654, "dur": 1.069, "args": { "External id": 21369,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557138.817, "dur": 1.387, "args": { "External id": 21370,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557148.896, "dur": 1.222, "args": { "External id": 21371,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3962 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651557262.939, "dur": 2557.599, "args": { "External id": 21372,"Record function id": 0, "Ev Idx": 3963 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651557284.686, "dur": 969.794, "args": { "External id": 21373,"Record function id": 0, "Ev Idx": 3964 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651557300.321, "dur": 302.641, "args": { "External id": 21374,"Record function id": 0, "Ev Idx": 3965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557376.610, "dur": 5.353, "args": { "External id": 21375,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557385.271, "dur": 1.434, "args": { "External id": 21376,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557388.516, "dur": 0.838, "args": { "External id": 21377,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557392.503, "dur": 1.230, "args": { "External id": 21378,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557395.262, "dur": 1.138, "args": { "External id": 21379,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557397.736, "dur": 1.957, "args": { "External id": 21380,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557401.235, "dur": 1.302, "args": { "External id": 21381,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557405.699, "dur": 0.790, "args": { "External id": 21382,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557407.775, "dur": 1.153, "args": { "External id": 21383,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651557410.301, "dur": 1.439, "args": { "External id": 21384,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3975 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651557429.135, "dur": 144.717, "args": { "External id": 21385,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651557444.845, "dur": 124.586, "args": { "External id": 21386,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651557461.174, "dur": 12.750, "args": { "External id": 21387,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651557477.263, "dur": 65.236, "args": { "External id": 21388,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651557480.200, "dur": 61.983, "args": { "External id": 21389,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557483.997, "dur": 5.161, "args": { "External id": 21390,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651557490.990, "dur": 50.677, "args": { "External id": 21391,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3982 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.10", "pid": 1336759, "tid": 1381173, "ts": 1295651557683.312, "dur": 544.408, "args": { "External id": 21392,"Record function id": 0, "Ev Idx": 3983 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651557698.591, "dur": 516.787, "args": { "External id": 21393,"Record function id": 0, "Ev Idx": 3984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651557750.442, "dur": 4.560, "args": { "External id": 21394,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651557770.668, "dur": 25.390, "args": { "External id": 21395,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557775.428, "dur": 1.718, "args": { "External id": 21396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557779.421, "dur": 0.291, "args": { "External id": 21397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557780.813, "dur": 0.312, "args": { "External id": 21398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557782.423, "dur": 0.903, "args": { "External id": 21399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557784.710, "dur": 0.447, "args": { "External id": 21400,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557786.593, "dur": 0.753, "args": { "External id": 21401,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557788.362, "dur": 0.704, "args": { "External id": 21402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557790.502, "dur": 0.405, "args": { "External id": 21403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557791.939, "dur": 0.714, "args": { "External id": 21404,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651557804.477, "dur": 27.013, "args": { "External id": 21405,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3996 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651557859.368, "dur": 89.301, "args": { "External id": 21406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651557868.032, "dur": 2.918, "args": { "External id": 21407,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651557875.581, "dur": 9.973, "args": { "External id": 21408,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651557879.637, "dur": 5.481, "args": { "External id": 21409,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557883.031, "dur": 0.474, "args": { "External id": 21410,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651557892.129, "dur": 22.697, "args": { "External id": 21411,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557894.023, "dur": 0.606, "args": { "External id": 21412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557896.007, "dur": 0.254, "args": { "External id": 21413,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557897.840, "dur": 0.706, "args": { "External id": 21414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557899.784, "dur": 0.296, "args": { "External id": 21415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557900.972, "dur": 0.622, "args": { "External id": 21416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557902.651, "dur": 0.627, "args": { "External id": 21417,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557904.456, "dur": 0.443, "args": { "External id": 21418,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557905.812, "dur": 0.717, "args": { "External id": 21419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651557907.650, "dur": 0.344, "args": { "External id": 21420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651557924.050, "dur": 17.550, "args": { "External id": 21421,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651558028.413, "dur": 114.788, "args": { "External id": 21422,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651558055.040, "dur": 84.613, "args": { "External id": 21423,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4014, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651558064.827, "dur": 70.719, "args": { "External id": 21424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651558160.010, "dur": 1.857, "args": { "External id": 21425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4016, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651558261.889, "dur": 1536.274, "args": { "External id": 21426,"Sequence number": 246564, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4017 } }, { "ph": "f", "id": 204, "pid": 1336759, "tid": 1381173, "ts": 1295651558261.889, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558366.514, "dur": 106.809, "args": { "External id": 21427,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4018 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651558514.013, "dur": 37.449, "args": { "External id": 21428,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651558566.227, "dur": 47.925, "args": { "External id": 21429,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558623.400, "dur": 32.871, "args": { "External id": 21430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558663.372, "dur": 45.167, "args": { "External id": 21431,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558715.203, "dur": 27.240, "args": { "External id": 21432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558749.587, "dur": 41.347, "args": { "External id": 21433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4024 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651558816.485, "dur": 21.146, "args": { "External id": 21434,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4025 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651558854.878, "dur": 25.257, "args": { "External id": 21435,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4026 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651558901.809, "dur": 17.907, "args": { "External id": 21436,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4027 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651558933.279, "dur": 12.875, "args": { "External id": 21437,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651558954.697, "dur": 65.078, "args": { "External id": 21438,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559025.477, "dur": 37.020, "args": { "External id": 21439,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4030 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651559090.004, "dur": 186.489, "args": { "External id": 21440,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651559168.992, "dur": 5.786, "args": { "External id": 21441,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651559176.645, "dur": 2.610, "args": { "External id": 21442,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4033 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651559312.308, "dur": 24.753, "args": { "External id": 21443,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4034 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651559348.581, "dur": 17.553, "args": { "External id": 21444,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559375.284, "dur": 38.261, "args": { "External id": 21445,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559422.415, "dur": 33.946, "args": { "External id": 21446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559462.835, "dur": 20.396, "args": { "External id": 21447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559487.793, "dur": 28.554, "args": { "External id": 21448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559521.942, "dur": 19.250, "args": { "External id": 21449,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651559547.328, "dur": 29.125, "args": { "External id": 21450,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4041 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651559596.891, "dur": 21.300, "args": { "External id": 21451,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4042 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651559633.829, "dur": 33.561, "args": { "External id": 21452,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4043 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651559689.950, "dur": 18.762, "args": { "External id": 21453,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4044 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651559724.948, "dur": 13.021, "args": { "External id": 21454,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4045 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651559756.149, "dur": 14.809, "args": { "External id": 21455,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4046 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559843.193, "dur": 14.642, "args": { "External id": 21456,"Record function id": 0, "Ev Idx": 4047 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559846.234, "dur": 10.671, "args": { "External id": 21457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559850.231, "dur": 5.846, "args": { "External id": 21458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4049 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559851.576, "dur": 4.371, "args": { "External id": 21459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4050 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559861.869, "dur": 4.565, "args": { "External id": 21460,"Record function id": 0, "Ev Idx": 4051 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559863.366, "dur": 2.601, "args": { "External id": 21461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559864.077, "dur": 1.421, "args": { "External id": 21462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4053 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559864.809, "dur": 0.619, "args": { "External id": 21463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4054 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559869.726, "dur": 4.338, "args": { "External id": 21464,"Record function id": 0, "Ev Idx": 4055 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559870.967, "dur": 2.657, "args": { "External id": 21465,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559871.486, "dur": 1.719, "args": { "External id": 21466,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4057 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559872.169, "dur": 0.938, "args": { "External id": 21467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4058 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559877.154, "dur": 3.468, "args": { "External id": 21468,"Record function id": 0, "Ev Idx": 4059 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559878.160, "dur": 2.044, "args": { "External id": 21469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559878.790, "dur": 0.991, "args": { "External id": 21470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4061 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559879.101, "dur": 0.587, "args": { "External id": 21471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4062 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559883.593, "dur": 3.531, "args": { "External id": 21472,"Record function id": 0, "Ev Idx": 4063 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559884.501, "dur": 2.166, "args": { "External id": 21473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559884.994, "dur": 1.239, "args": { "External id": 21474,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4065 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559885.462, "dur": 0.704, "args": { "External id": 21475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4066 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559890.106, "dur": 3.920, "args": { "External id": 21476,"Record function id": 0, "Ev Idx": 4067 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559891.140, "dur": 2.450, "args": { "External id": 21477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559891.617, "dur": 1.593, "args": { "External id": 21478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4069 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559891.990, "dur": 1.144, "args": { "External id": 21479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4070 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559897.049, "dur": 3.767, "args": { "External id": 21480,"Record function id": 0, "Ev Idx": 4071 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559898.054, "dur": 2.321, "args": { "External id": 21481,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559898.724, "dur": 1.216, "args": { "External id": 21482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4073 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559899.195, "dur": 0.679, "args": { "External id": 21483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4074 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559903.821, "dur": 5.259, "args": { "External id": 21484,"Record function id": 0, "Ev Idx": 4075 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559904.760, "dur": 3.891, "args": { "External id": 21485,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559905.514, "dur": 2.719, "args": { "External id": 21486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4077 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559907.616, "dur": 0.514, "args": { "External id": 21487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4078 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559912.084, "dur": 3.520, "args": { "External id": 21488,"Record function id": 0, "Ev Idx": 4079 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651559912.976, "dur": 2.178, "args": { "External id": 21489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559913.429, "dur": 1.336, "args": { "External id": 21490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4081 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651559913.688, "dur": 0.995, "args": { "External id": 21491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4082 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651559919.010, "dur": 36616.630, "args": { "External id": 21492,"Record function id": 0, "Sequence number": 246563, "Fwd thread id": 1, "Ev Idx": 4083 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651559920.183, "dur": 36604.493, "args": { "External id": 21493,"Sequence number": 246563, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4084 } }, { "ph": "f", "id": 205, "pid": 1336759, "tid": 1381173, "ts": 1295651559920.183, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651559948.863, "dur": 73.196, "args": { "External id": 21494,"Record function id": 0, "Ev Idx": 4085 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651560036.352, "dur": 67.767, "args": { "External id": 21495,"Record function id": 0, "Ev Idx": 4086 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.11)", "pid": 1336759, "tid": 1381173, "ts": 1295651560110.868, "dur": 36406.091, "args": { "External id": 21496,"Record function id": 0, "Ev Idx": 4087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651560199.342, "dur": 7.181, "args": { "External id": 21497,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651560216.556, "dur": 8.127, "args": { "External id": 21498,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4089 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651560259.190, "dur": 35470.593, "args": { "External id": 21499,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651560272.808, "dur": 35448.238, "args": { "External id": 21500,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651560313.725, "dur": 17.298, "args": { "External id": 21501,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651560337.284, "dur": 35346.842, "args": { "External id": 21502,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651560339.804, "dur": 35343.615, "args": { "External id": 21503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651560343.404, "dur": 6.581, "args": { "External id": 21504,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651560371.862, "dur": 35307.944, "args": { "External id": 21505,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651595821.605, "dur": 8.665, "args": { "External id": 21506,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651595824.143, "dur": 5.675, "args": { "External id": 21507,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4098 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651595857.895, "dur": 348.512, "args": { "External id": 21508,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4099 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651595886.203, "dur": 314.855, "args": { "External id": 21509,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4100, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651595898.129, "dur": 296.899, "args": { "External id": 21510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4101 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651596241.880, "dur": 3.245, "args": { "External id": 21511,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4102, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596308.776, "dur": 7.137, "args": { "External id": 21512,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596361.068, "dur": 1.422, "args": { "External id": 21513,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596379.583, "dur": 1.179, "args": { "External id": 21514,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596392.118, "dur": 0.882, "args": { "External id": 21515,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596403.419, "dur": 0.885, "args": { "External id": 21516,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596412.701, "dur": 1.128, "args": { "External id": 21517,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596426.529, "dur": 1.174, "args": { "External id": 21518,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596438.485, "dur": 1.070, "args": { "External id": 21519,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596450.589, "dur": 1.390, "args": { "External id": 21520,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651596550.923, "dur": 2612.714, "args": { "External id": 21521,"Record function id": 0, "Ev Idx": 4112 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651596569.050, "dur": 982.543, "args": { "External id": 21522,"Record function id": 0, "Ev Idx": 4113 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651596584.158, "dur": 292.320, "args": { "External id": 21523,"Record function id": 0, "Ev Idx": 4114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596655.223, "dur": 4.274, "args": { "External id": 21524,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596662.460, "dur": 1.196, "args": { "External id": 21525,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596665.407, "dur": 1.033, "args": { "External id": 21526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596668.021, "dur": 1.745, "args": { "External id": 21527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596672.732, "dur": 1.431, "args": { "External id": 21528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596675.362, "dur": 1.707, "args": { "External id": 21529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596678.552, "dur": 1.043, "args": { "External id": 21530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596680.847, "dur": 0.858, "args": { "External id": 21531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596684.529, "dur": 1.052, "args": { "External id": 21532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651596686.941, "dur": 1.491, "args": { "External id": 21533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4124 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651596705.460, "dur": 143.745, "args": { "External id": 21534,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651596720.769, "dur": 124.006, "args": { "External id": 21535,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651596737.048, "dur": 12.676, "args": { "External id": 21536,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651596752.857, "dur": 65.470, "args": { "External id": 21537,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651596755.682, "dur": 62.303, "args": { "External id": 21538,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651596759.344, "dur": 5.483, "args": { "External id": 21539,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651596766.335, "dur": 51.084, "args": { "External id": 21540,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4131 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.9", "pid": 1336759, "tid": 1381173, "ts": 1295651596950.847, "dur": 592.652, "args": { "External id": 21541,"Record function id": 0, "Ev Idx": 4132 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651596966.224, "dur": 564.787, "args": { "External id": 21542,"Record function id": 0, "Ev Idx": 4133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651597063.430, "dur": 6.923, "args": { "External id": 21543,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651597086.404, "dur": 30.165, "args": { "External id": 21544,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597091.317, "dur": 6.315, "args": { "External id": 21545,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597099.535, "dur": 0.228, "args": { "External id": 21546,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597100.580, "dur": 0.316, "args": { "External id": 21547,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597101.797, "dur": 0.497, "args": { "External id": 21548,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597103.128, "dur": 0.836, "args": { "External id": 21549,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597104.904, "dur": 0.294, "args": { "External id": 21550,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597109.706, "dur": 0.298, "args": { "External id": 21551,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597110.889, "dur": 0.451, "args": { "External id": 21552,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597112.490, "dur": 0.650, "args": { "External id": 21553,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651597126.243, "dur": 33.261, "args": { "External id": 21554,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4145 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651597189.698, "dur": 112.548, "args": { "External id": 21555,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651597199.126, "dur": 3.030, "args": { "External id": 21556,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651597206.609, "dur": 10.161, "args": { "External id": 21557,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651597210.825, "dur": 5.544, "args": { "External id": 21558,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597214.154, "dur": 0.593, "args": { "External id": 21559,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651597225.666, "dur": 39.292, "args": { "External id": 21560,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597227.273, "dur": 14.884, "args": { "External id": 21561,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597244.858, "dur": 0.972, "args": { "External id": 21562,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597247.564, "dur": 0.402, "args": { "External id": 21563,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597249.633, "dur": 0.616, "args": { "External id": 21564,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597251.603, "dur": 0.591, "args": { "External id": 21565,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597253.188, "dur": 0.705, "args": { "External id": 21566,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597254.726, "dur": 0.602, "args": { "External id": 21567,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597256.595, "dur": 0.616, "args": { "External id": 21568,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651597258.041, "dur": 1.222, "args": { "External id": 21569,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651597275.019, "dur": 19.814, "args": { "External id": 21570,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651597349.638, "dur": 114.451, "args": { "External id": 21571,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651597376.191, "dur": 84.516, "args": { "External id": 21572,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4163, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651597385.795, "dur": 70.959, "args": { "External id": 21573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651597479.145, "dur": 1.972, "args": { "External id": 21574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4165, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651597559.249, "dur": 1582.788, "args": { "External id": 21575,"Sequence number": 246562, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4166 } }, { "ph": "f", "id": 206, "pid": 1336759, "tid": 1381173, "ts": 1295651597559.249, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651597661.589, "dur": 102.237, "args": { "External id": 21576,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651597801.258, "dur": 38.552, "args": { "External id": 21577,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651597855.947, "dur": 46.950, "args": { "External id": 21578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651597912.109, "dur": 31.451, "args": { "External id": 21579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651597949.914, "dur": 87.893, "args": { "External id": 21580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598049.796, "dur": 31.582, "args": { "External id": 21581,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598089.097, "dur": 43.011, "args": { "External id": 21582,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4173 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651598159.331, "dur": 26.644, "args": { "External id": 21583,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4174 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651598213.730, "dur": 47.916, "args": { "External id": 21584,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4175 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651598286.202, "dur": 21.743, "args": { "External id": 21585,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4176 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651598322.594, "dur": 13.951, "args": { "External id": 21586,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598345.478, "dur": 32.135, "args": { "External id": 21587,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598380.800, "dur": 32.277, "args": { "External id": 21588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4179 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651598439.666, "dur": 160.013, "args": { "External id": 21589,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651598513.483, "dur": 5.965, "args": { "External id": 21590,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651598521.542, "dur": 2.270, "args": { "External id": 21591,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4182 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651598629.168, "dur": 23.935, "args": { "External id": 21592,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4183 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651598666.303, "dur": 13.526, "args": { "External id": 21593,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598687.338, "dur": 32.293, "args": { "External id": 21594,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598725.510, "dur": 32.238, "args": { "External id": 21595,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598764.367, "dur": 19.750, "args": { "External id": 21596,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598788.899, "dur": 28.377, "args": { "External id": 21597,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598823.429, "dur": 19.230, "args": { "External id": 21598,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651598848.224, "dur": 28.403, "args": { "External id": 21599,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4190 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651598894.406, "dur": 20.871, "args": { "External id": 21600,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4191 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651598931.666, "dur": 33.041, "args": { "External id": 21601,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651599025.304, "dur": 25.585, "args": { "External id": 21602,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4193 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651599070.030, "dur": 14.520, "args": { "External id": 21603,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651599098.128, "dur": 15.740, "args": { "External id": 21604,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4195 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599186.876, "dur": 15.032, "args": { "External id": 21605,"Record function id": 0, "Ev Idx": 4196 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599190.027, "dur": 10.829, "args": { "External id": 21606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599194.445, "dur": 5.469, "args": { "External id": 21607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4198 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599195.627, "dur": 4.164, "args": { "External id": 21608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4199 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599205.705, "dur": 8.645, "args": { "External id": 21609,"Record function id": 0, "Ev Idx": 4200 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599207.308, "dur": 6.612, "args": { "External id": 21610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599211.635, "dur": 1.834, "args": { "External id": 21611,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4202 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599211.947, "dur": 1.424, "args": { "External id": 21612,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4203 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599217.639, "dur": 4.257, "args": { "External id": 21613,"Record function id": 0, "Ev Idx": 4204 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599218.908, "dur": 2.577, "args": { "External id": 21614,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599219.448, "dur": 1.603, "args": { "External id": 21615,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4206 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599220.067, "dur": 0.900, "args": { "External id": 21616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4207 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599224.960, "dur": 20.077, "args": { "External id": 21617,"Record function id": 0, "Ev Idx": 4208 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599226.300, "dur": 17.663, "args": { "External id": 21618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599226.900, "dur": 15.983, "args": { "External id": 21619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4210 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599227.354, "dur": 0.450, "args": { "External id": 21620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599250.433, "dur": 5.775, "args": { "External id": 21621,"Record function id": 0, "Ev Idx": 4212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599251.764, "dur": 4.004, "args": { "External id": 21622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599252.934, "dur": 2.375, "args": { "External id": 21623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599253.563, "dur": 1.665, "args": { "External id": 21624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599259.577, "dur": 5.721, "args": { "External id": 21625,"Record function id": 0, "Ev Idx": 4216 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599261.032, "dur": 3.866, "args": { "External id": 21626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599261.713, "dur": 2.736, "args": { "External id": 21627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4218 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599263.662, "dur": 0.720, "args": { "External id": 21628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599268.515, "dur": 4.442, "args": { "External id": 21629,"Record function id": 0, "Ev Idx": 4220 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599269.629, "dur": 2.922, "args": { "External id": 21630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599270.627, "dur": 1.498, "args": { "External id": 21631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4222 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599271.334, "dur": 0.716, "args": { "External id": 21632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4223 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599276.080, "dur": 3.736, "args": { "External id": 21633,"Record function id": 0, "Ev Idx": 4224 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599277.076, "dur": 2.328, "args": { "External id": 21634,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599277.688, "dur": 1.254, "args": { "External id": 21635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4226 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599278.108, "dur": 0.769, "args": { "External id": 21636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4227 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599282.812, "dur": 3.399, "args": { "External id": 21637,"Record function id": 0, "Ev Idx": 4228 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651599283.726, "dur": 2.084, "args": { "External id": 21638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599284.376, "dur": 1.012, "args": { "External id": 21639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4230 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651599284.704, "dur": 0.608, "args": { "External id": 21640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4231 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651599293.178, "dur": 36391.475, "args": { "External id": 21641,"Record function id": 0, "Sequence number": 246561, "Fwd thread id": 1, "Ev Idx": 4232 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651599294.530, "dur": 36381.793, "args": { "External id": 21642,"Sequence number": 246561, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4233 } }, { "ph": "f", "id": 207, "pid": 1336759, "tid": 1381173, "ts": 1295651599294.530, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651599325.615, "dur": 40.941, "args": { "External id": 21643,"Record function id": 0, "Ev Idx": 4234 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651599374.024, "dur": 60.146, "args": { "External id": 21644,"Record function id": 0, "Ev Idx": 4235 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.10)", "pid": 1336759, "tid": 1381173, "ts": 1295651599439.725, "dur": 36228.703, "args": { "External id": 21645,"Record function id": 0, "Ev Idx": 4236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651599531.002, "dur": 6.884, "args": { "External id": 21646,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651599550.790, "dur": 5.083, "args": { "External id": 21647,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4238 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651599570.442, "dur": 35259.264, "args": { "External id": 21648,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651599583.491, "dur": 35236.642, "args": { "External id": 21649,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651599631.240, "dur": 15.435, "args": { "External id": 21650,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651599652.897, "dur": 35130.837, "args": { "External id": 21651,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651599655.533, "dur": 35127.529, "args": { "External id": 21652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651599659.441, "dur": 5.987, "args": { "External id": 21653,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651599667.048, "dur": 35112.472, "args": { "External id": 21654,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651634925.411, "dur": 9.312, "args": { "External id": 21655,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651634928.438, "dur": 5.912, "args": { "External id": 21656,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4247 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651634964.364, "dur": 419.237, "args": { "External id": 21657,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4248 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651635015.744, "dur": 362.401, "args": { "External id": 21658,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4249, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651635029.423, "dur": 342.735, "args": { "External id": 21659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4250 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651635407.158, "dur": 2.222, "args": { "External id": 21660,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4251, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635472.383, "dur": 6.895, "args": { "External id": 21661,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635523.397, "dur": 1.587, "args": { "External id": 21662,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635539.591, "dur": 1.601, "args": { "External id": 21663,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635551.485, "dur": 0.719, "args": { "External id": 21664,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635564.144, "dur": 1.163, "args": { "External id": 21665,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635574.767, "dur": 1.108, "args": { "External id": 21666,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635585.142, "dur": 0.983, "args": { "External id": 21667,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635596.346, "dur": 1.265, "args": { "External id": 21668,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635606.222, "dur": 1.314, "args": { "External id": 21669,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4260 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651635698.531, "dur": 2583.268, "args": { "External id": 21670,"Record function id": 0, "Ev Idx": 4261 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651635716.399, "dur": 966.546, "args": { "External id": 21671,"Record function id": 0, "Ev Idx": 4262 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651635730.421, "dur": 339.994, "args": { "External id": 21672,"Record function id": 0, "Ev Idx": 4263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635801.075, "dur": 3.985, "args": { "External id": 21673,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635809.250, "dur": 1.619, "args": { "External id": 21674,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635812.565, "dur": 0.795, "args": { "External id": 21675,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635814.673, "dur": 1.113, "args": { "External id": 21676,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635817.304, "dur": 1.360, "args": { "External id": 21677,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635821.633, "dur": 1.146, "args": { "External id": 21678,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635824.209, "dur": 1.448, "args": { "External id": 21679,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635827.204, "dur": 0.873, "args": { "External id": 21680,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635829.197, "dur": 1.552, "args": { "External id": 21681,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651635833.593, "dur": 1.264, "args": { "External id": 21682,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4273 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651635853.096, "dur": 184.831, "args": { "External id": 21683,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651635868.430, "dur": 164.113, "args": { "External id": 21684,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651635884.676, "dur": 12.165, "args": { "External id": 21685,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651635900.092, "dur": 65.794, "args": { "External id": 21686,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651635902.757, "dur": 62.805, "args": { "External id": 21687,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651635906.659, "dur": 5.442, "args": { "External id": 21688,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651635915.977, "dur": 49.048, "args": { "External id": 21689,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4280 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.8", "pid": 1336759, "tid": 1381173, "ts": 1295651636149.360, "dur": 526.082, "args": { "External id": 21690,"Record function id": 0, "Ev Idx": 4281 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651636164.926, "dur": 498.934, "args": { "External id": 21691,"Record function id": 0, "Ev Idx": 4282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651636219.019, "dur": 5.908, "args": { "External id": 21692,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651636256.641, "dur": 23.920, "args": { "External id": 21693,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636261.393, "dur": 1.891, "args": { "External id": 21694,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636265.118, "dur": 0.498, "args": { "External id": 21695,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636267.297, "dur": 0.408, "args": { "External id": 21696,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636268.671, "dur": 0.195, "args": { "External id": 21697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636270.751, "dur": 0.616, "args": { "External id": 21698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636272.291, "dur": 0.169, "args": { "External id": 21699,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636273.832, "dur": 0.629, "args": { "External id": 21700,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636275.191, "dur": 0.396, "args": { "External id": 21701,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636276.665, "dur": 0.598, "args": { "External id": 21702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651636290.956, "dur": 31.148, "args": { "External id": 21703,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651636352.042, "dur": 93.087, "args": { "External id": 21704,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651636362.821, "dur": 4.135, "args": { "External id": 21705,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651636372.112, "dur": 10.032, "args": { "External id": 21706,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651636376.421, "dur": 5.308, "args": { "External id": 21707,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636379.530, "dur": 0.556, "args": { "External id": 21708,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651636389.265, "dur": 21.835, "args": { "External id": 21709,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636391.246, "dur": 0.856, "args": { "External id": 21710,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636393.277, "dur": 0.841, "args": { "External id": 21711,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636395.340, "dur": 0.550, "args": { "External id": 21712,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636396.464, "dur": 0.882, "args": { "External id": 21713,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636398.303, "dur": 0.601, "args": { "External id": 21714,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636399.457, "dur": 0.675, "args": { "External id": 21715,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636401.421, "dur": 0.393, "args": { "External id": 21716,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636402.796, "dur": 0.651, "args": { "External id": 21717,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651636404.674, "dur": 0.361, "args": { "External id": 21718,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651636420.493, "dur": 17.615, "args": { "External id": 21719,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651636488.251, "dur": 108.862, "args": { "External id": 21720,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651636512.061, "dur": 81.848, "args": { "External id": 21721,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4312, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651636522.695, "dur": 67.219, "args": { "External id": 21722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651636612.839, "dur": 1.890, "args": { "External id": 21723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4314, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651636693.142, "dur": 1564.755, "args": { "External id": 21724,"Sequence number": 246560, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4315 } }, { "ph": "f", "id": 208, "pid": 1336759, "tid": 1381173, "ts": 1295651636693.142, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651636794.702, "dur": 108.940, "args": { "External id": 21725,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4316 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651636940.618, "dur": 35.663, "args": { "External id": 21726,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651637036.697, "dur": 54.843, "args": { "External id": 21727,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637101.398, "dur": 32.101, "args": { "External id": 21728,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637139.914, "dur": 44.382, "args": { "External id": 21729,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637191.596, "dur": 27.006, "args": { "External id": 21730,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637224.969, "dur": 59.848, "args": { "External id": 21731,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4322 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651637313.352, "dur": 20.969, "args": { "External id": 21732,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4323 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651637351.764, "dur": 25.908, "args": { "External id": 21733,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4324 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651637398.764, "dur": 18.080, "args": { "External id": 21734,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651637430.610, "dur": 13.828, "args": { "External id": 21735,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637452.903, "dur": 28.146, "args": { "External id": 21736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637483.920, "dur": 31.450, "args": { "External id": 21737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4328 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651637540.405, "dur": 160.719, "args": { "External id": 21738,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651637614.425, "dur": 5.632, "args": { "External id": 21739,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651637622.046, "dur": 2.233, "args": { "External id": 21740,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4331 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651637729.838, "dur": 22.535, "args": { "External id": 21741,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4332 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651637765.358, "dur": 13.040, "args": { "External id": 21742,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637785.403, "dur": 31.047, "args": { "External id": 21743,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637821.563, "dur": 33.068, "args": { "External id": 21744,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637861.349, "dur": 20.322, "args": { "External id": 21745,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637890.394, "dur": 29.052, "args": { "External id": 21746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637925.541, "dur": 19.595, "args": { "External id": 21747,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651637951.487, "dur": 28.627, "args": { "External id": 21748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4339 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651638039.517, "dur": 23.627, "args": { "External id": 21749,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4340 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651638080.945, "dur": 20.939, "args": { "External id": 21750,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4341 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651638117.707, "dur": 16.320, "args": { "External id": 21751,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4342 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651638148.637, "dur": 24.088, "args": { "External id": 21752,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4343 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651638193.532, "dur": 18.404, "args": { "External id": 21753,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4344 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638304.809, "dur": 15.802, "args": { "External id": 21754,"Record function id": 0, "Ev Idx": 4345 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638308.098, "dur": 11.545, "args": { "External id": 21755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638312.450, "dur": 6.304, "args": { "External id": 21756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4347 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638313.936, "dur": 4.673, "args": { "External id": 21757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4348 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638324.626, "dur": 8.236, "args": { "External id": 21758,"Record function id": 0, "Ev Idx": 4349 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638325.767, "dur": 6.665, "args": { "External id": 21759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638330.582, "dur": 1.376, "args": { "External id": 21760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4351 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638330.988, "dur": 0.862, "args": { "External id": 21761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4352 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638336.086, "dur": 4.081, "args": { "External id": 21762,"Record function id": 0, "Ev Idx": 4353 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638337.321, "dur": 2.393, "args": { "External id": 21763,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638337.945, "dur": 1.336, "args": { "External id": 21764,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4355 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638338.461, "dur": 0.726, "args": { "External id": 21765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4356 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638343.387, "dur": 3.147, "args": { "External id": 21766,"Record function id": 0, "Ev Idx": 4357 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638344.334, "dur": 1.790, "args": { "External id": 21767,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638344.891, "dur": 0.815, "args": { "External id": 21768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4359 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638345.163, "dur": 0.451, "args": { "External id": 21769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4360 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638349.587, "dur": 3.439, "args": { "External id": 21770,"Record function id": 0, "Ev Idx": 4361 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638350.536, "dur": 2.067, "args": { "External id": 21771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638351.009, "dur": 1.138, "args": { "External id": 21772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4363 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638351.354, "dur": 0.728, "args": { "External id": 21773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4364 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638356.027, "dur": 3.383, "args": { "External id": 21774,"Record function id": 0, "Ev Idx": 4365 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638356.906, "dur": 2.086, "args": { "External id": 21775,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638357.479, "dur": 1.057, "args": { "External id": 21776,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4367 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638357.914, "dur": 0.555, "args": { "External id": 21777,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638362.542, "dur": 3.064, "args": { "External id": 21778,"Record function id": 0, "Ev Idx": 4369 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638363.447, "dur": 1.734, "args": { "External id": 21779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638363.943, "dur": 0.818, "args": { "External id": 21780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4371 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638364.223, "dur": 0.467, "args": { "External id": 21781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4372 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638368.687, "dur": 2.945, "args": { "External id": 21782,"Record function id": 0, "Ev Idx": 4373 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638369.633, "dur": 1.601, "args": { "External id": 21783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638370.069, "dur": 0.764, "args": { "External id": 21784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4375 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638370.321, "dur": 0.438, "args": { "External id": 21785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4376 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638374.661, "dur": 5.144, "args": { "External id": 21786,"Record function id": 0, "Ev Idx": 4377 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651638375.862, "dur": 3.541, "args": { "External id": 21787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638376.377, "dur": 2.590, "args": { "External id": 21788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4379 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651638378.198, "dur": 0.704, "args": { "External id": 21789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651638383.511, "dur": 36169.055, "args": { "External id": 21790,"Record function id": 0, "Sequence number": 246559, "Fwd thread id": 1, "Ev Idx": 4381 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651638384.588, "dur": 36159.723, "args": { "External id": 21791,"Sequence number": 246559, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4382 } }, { "ph": "f", "id": 209, "pid": 1336759, "tid": 1381173, "ts": 1295651638384.588, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651638412.842, "dur": 37.966, "args": { "External id": 21792,"Record function id": 0, "Ev Idx": 4383 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651638458.634, "dur": 63.199, "args": { "External id": 21793,"Record function id": 0, "Ev Idx": 4384 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.9)", "pid": 1336759, "tid": 1381173, "ts": 1295651638527.357, "dur": 36009.300, "args": { "External id": 21794,"Record function id": 0, "Ev Idx": 4385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651638621.509, "dur": 6.479, "args": { "External id": 21795,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651638637.177, "dur": 4.822, "args": { "External id": 21796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4387 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651638659.566, "dur": 35068.607, "args": { "External id": 21797,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651638674.053, "dur": 35044.309, "args": { "External id": 21798,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651638724.748, "dur": 15.936, "args": { "External id": 21799,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651638747.093, "dur": 34932.601, "args": { "External id": 21800,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651638749.740, "dur": 34929.199, "args": { "External id": 21801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651638753.730, "dur": 5.128, "args": { "External id": 21802,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651638760.527, "dur": 34914.764, "args": { "External id": 21803,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651673823.518, "dur": 10.032, "args": { "External id": 21804,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651673826.441, "dur": 6.675, "args": { "External id": 21805,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4396 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651673861.310, "dur": 393.668, "args": { "External id": 21806,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4397 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651673890.825, "dur": 358.751, "args": { "External id": 21807,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4398, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651673901.616, "dur": 340.328, "args": { "External id": 21808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4399 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651674279.486, "dur": 2.450, "args": { "External id": 21809,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4400, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674343.668, "dur": 7.325, "args": { "External id": 21810,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674393.447, "dur": 1.441, "args": { "External id": 21811,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674409.730, "dur": 1.412, "args": { "External id": 21812,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674421.680, "dur": 0.757, "args": { "External id": 21813,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674432.516, "dur": 1.044, "args": { "External id": 21814,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674442.898, "dur": 0.868, "args": { "External id": 21815,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674453.711, "dur": 0.997, "args": { "External id": 21816,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674464.450, "dur": 1.478, "args": { "External id": 21817,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674474.464, "dur": 1.189, "args": { "External id": 21818,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4409 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651674566.801, "dur": 2624.220, "args": { "External id": 21819,"Record function id": 0, "Ev Idx": 4410 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651674585.976, "dur": 987.817, "args": { "External id": 21820,"Record function id": 0, "Ev Idx": 4411 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651674600.226, "dur": 294.903, "args": { "External id": 21821,"Record function id": 0, "Ev Idx": 4412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674673.912, "dur": 4.611, "args": { "External id": 21822,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674683.448, "dur": 0.898, "args": { "External id": 21823,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674686.016, "dur": 1.050, "args": { "External id": 21824,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674688.380, "dur": 0.891, "args": { "External id": 21825,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674690.691, "dur": 1.892, "args": { "External id": 21826,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674695.912, "dur": 1.025, "args": { "External id": 21827,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674698.371, "dur": 1.155, "args": { "External id": 21828,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674700.673, "dur": 1.002, "args": { "External id": 21829,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674702.790, "dur": 1.234, "args": { "External id": 21830,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651674707.268, "dur": 0.753, "args": { "External id": 21831,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4422 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651674725.348, "dur": 142.227, "args": { "External id": 21832,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651674741.329, "dur": 122.073, "args": { "External id": 21833,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651674757.447, "dur": 12.422, "args": { "External id": 21834,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651674772.893, "dur": 64.699, "args": { "External id": 21835,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651674775.273, "dur": 61.913, "args": { "External id": 21836,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651674779.103, "dur": 4.770, "args": { "External id": 21837,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651674785.601, "dur": 51.117, "args": { "External id": 21838,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4429 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.7", "pid": 1336759, "tid": 1381173, "ts": 1295651674970.923, "dur": 595.854, "args": { "External id": 21839,"Record function id": 0, "Ev Idx": 4430 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651675029.313, "dur": 524.907, "args": { "External id": 21840,"Record function id": 0, "Ev Idx": 4431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651675088.194, "dur": 6.313, "args": { "External id": 21841,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651675110.495, "dur": 22.239, "args": { "External id": 21842,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675115.069, "dur": 1.721, "args": { "External id": 21843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675118.380, "dur": 0.375, "args": { "External id": 21844,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675119.745, "dur": 0.808, "args": { "External id": 21845,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675121.799, "dur": 0.276, "args": { "External id": 21846,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675122.798, "dur": 0.922, "args": { "External id": 21847,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675125.007, "dur": 0.265, "args": { "External id": 21848,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675125.919, "dur": 0.468, "args": { "External id": 21849,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675127.571, "dur": 0.461, "args": { "External id": 21850,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675129.041, "dur": 0.309, "args": { "External id": 21851,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651675142.032, "dur": 35.089, "args": { "External id": 21852,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4443 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651675207.119, "dur": 111.359, "args": { "External id": 21853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651675216.456, "dur": 2.951, "args": { "External id": 21854,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651675224.084, "dur": 27.115, "args": { "External id": 21855,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651675243.888, "dur": 6.888, "args": { "External id": 21856,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675248.010, "dur": 0.808, "args": { "External id": 21857,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651675259.167, "dur": 20.220, "args": { "External id": 21858,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675260.502, "dur": 0.272, "args": { "External id": 21859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675261.967, "dur": 0.700, "args": { "External id": 21860,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675263.932, "dur": 0.282, "args": { "External id": 21861,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675264.798, "dur": 0.567, "args": { "External id": 21862,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675266.307, "dur": 0.330, "args": { "External id": 21863,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675267.964, "dur": 0.770, "args": { "External id": 21864,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675270.020, "dur": 0.631, "args": { "External id": 21865,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675271.784, "dur": 0.797, "args": { "External id": 21866,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651675273.759, "dur": 0.270, "args": { "External id": 21867,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651675291.649, "dur": 19.343, "args": { "External id": 21868,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651675363.926, "dur": 119.769, "args": { "External id": 21869,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651675394.033, "dur": 86.116, "args": { "External id": 21870,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4461, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651675404.500, "dur": 71.559, "args": { "External id": 21871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651675502.037, "dur": 1.984, "args": { "External id": 21872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4463, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651675580.301, "dur": 1589.506, "args": { "External id": 21873,"Sequence number": 246558, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4464 } }, { "ph": "f", "id": 210, "pid": 1336759, "tid": 1381173, "ts": 1295651675580.301, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651675682.197, "dur": 102.364, "args": { "External id": 21874,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4465 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651675821.871, "dur": 37.176, "args": { "External id": 21875,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651675874.335, "dur": 47.369, "args": { "External id": 21876,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651675930.555, "dur": 31.954, "args": { "External id": 21877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651675969.092, "dur": 87.746, "args": { "External id": 21878,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676068.491, "dur": 30.968, "args": { "External id": 21879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676107.273, "dur": 42.166, "args": { "External id": 21880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4471 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651676176.375, "dur": 21.872, "args": { "External id": 21881,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4472 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651676216.530, "dur": 42.422, "args": { "External id": 21882,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4473 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651676283.789, "dur": 19.279, "args": { "External id": 21883,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4474 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651676316.567, "dur": 13.572, "args": { "External id": 21884,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676338.540, "dur": 30.682, "args": { "External id": 21885,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676372.302, "dur": 32.325, "args": { "External id": 21886,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4477 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651676430.811, "dur": 169.188, "args": { "External id": 21887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651676508.010, "dur": 6.264, "args": { "External id": 21888,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651676519.363, "dur": 2.311, "args": { "External id": 21889,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4480 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651676631.738, "dur": 25.527, "args": { "External id": 21890,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4481 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651676668.837, "dur": 14.148, "args": { "External id": 21891,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676691.220, "dur": 39.758, "args": { "External id": 21892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676736.956, "dur": 33.879, "args": { "External id": 21893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676777.635, "dur": 20.081, "args": { "External id": 21894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676802.132, "dur": 28.949, "args": { "External id": 21895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676837.116, "dur": 19.056, "args": { "External id": 21896,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651676861.857, "dur": 28.758, "args": { "External id": 21897,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4488 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651676909.465, "dur": 21.707, "args": { "External id": 21898,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4489 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651676950.400, "dur": 21.320, "args": { "External id": 21899,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4490 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651677025.974, "dur": 31.171, "args": { "External id": 21900,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4491 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651677092.236, "dur": 16.669, "args": { "External id": 21901,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4492 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651677122.224, "dur": 19.460, "args": { "External id": 21902,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4493 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677213.585, "dur": 33.770, "args": { "External id": 21903,"Record function id": 0, "Ev Idx": 4494 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677216.816, "dur": 10.804, "args": { "External id": 21904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677221.193, "dur": 5.580, "args": { "External id": 21905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4496 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677222.657, "dur": 4.022, "args": { "External id": 21906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4497 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677254.401, "dur": 6.546, "args": { "External id": 21907,"Record function id": 0, "Ev Idx": 4498 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677256.045, "dur": 4.404, "args": { "External id": 21908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677257.347, "dur": 2.303, "args": { "External id": 21909,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4500 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677258.025, "dur": 1.547, "args": { "External id": 21910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4501 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677264.267, "dur": 4.607, "args": { "External id": 21911,"Record function id": 0, "Ev Idx": 4502 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677265.426, "dur": 3.025, "args": { "External id": 21912,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677266.034, "dur": 1.996, "args": { "External id": 21913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4504 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677266.803, "dur": 1.117, "args": { "External id": 21914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4505 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677271.987, "dur": 3.562, "args": { "External id": 21915,"Record function id": 0, "Ev Idx": 4506 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677273.074, "dur": 2.021, "args": { "External id": 21916,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677273.629, "dur": 1.031, "args": { "External id": 21917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4508 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677273.925, "dur": 0.642, "args": { "External id": 21918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4509 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677278.538, "dur": 3.445, "args": { "External id": 21919,"Record function id": 0, "Ev Idx": 4510 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677279.503, "dur": 2.063, "args": { "External id": 21920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677280.027, "dur": 1.119, "args": { "External id": 21921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4512 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677280.395, "dur": 0.678, "args": { "External id": 21922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4513 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677284.940, "dur": 5.299, "args": { "External id": 21923,"Record function id": 0, "Ev Idx": 4514 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677285.939, "dur": 3.857, "args": { "External id": 21924,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677286.405, "dur": 2.994, "args": { "External id": 21925,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4516 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677288.685, "dur": 0.601, "args": { "External id": 21926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4517 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677293.380, "dur": 3.692, "args": { "External id": 21927,"Record function id": 0, "Ev Idx": 4518 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677294.331, "dur": 2.328, "args": { "External id": 21928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677294.919, "dur": 1.341, "args": { "External id": 21929,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4520 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677295.285, "dur": 0.909, "args": { "External id": 21930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4521 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677303.155, "dur": 3.942, "args": { "External id": 21931,"Record function id": 0, "Ev Idx": 4522 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677304.218, "dur": 2.446, "args": { "External id": 21932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677304.776, "dur": 1.473, "args": { "External id": 21933,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4524 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677305.363, "dur": 0.822, "args": { "External id": 21934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4525 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677310.262, "dur": 3.482, "args": { "External id": 21935,"Record function id": 0, "Ev Idx": 4526 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651677311.305, "dur": 2.031, "args": { "External id": 21936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677311.783, "dur": 1.078, "args": { "External id": 21937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4528 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651677312.178, "dur": 0.611, "args": { "External id": 21938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651677317.291, "dur": 36795.236, "args": { "External id": 21939,"Record function id": 0, "Sequence number": 246557, "Fwd thread id": 1, "Ev Idx": 4530 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651677318.558, "dur": 36784.920, "args": { "External id": 21940,"Sequence number": 246557, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4531 } }, { "ph": "f", "id": 211, "pid": 1336759, "tid": 1381173, "ts": 1295651677318.558, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651677348.356, "dur": 40.025, "args": { "External id": 21941,"Record function id": 0, "Ev Idx": 4532 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651677396.989, "dur": 66.642, "args": { "External id": 21942,"Record function id": 0, "Ev Idx": 4533 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.8)", "pid": 1336759, "tid": 1381173, "ts": 1295651677469.023, "dur": 36626.397, "args": { "External id": 21943,"Record function id": 0, "Ev Idx": 4534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651677556.540, "dur": 6.738, "args": { "External id": 21944,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651677572.899, "dur": 4.931, "args": { "External id": 21945,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4536 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651677592.381, "dur": 35679.195, "args": { "External id": 21946,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651677605.638, "dur": 35657.041, "args": { "External id": 21947,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651677655.863, "dur": 16.428, "args": { "External id": 21948,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651677678.636, "dur": 35537.626, "args": { "External id": 21949,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651677681.320, "dur": 35534.301, "args": { "External id": 21950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651677688.263, "dur": 5.226, "args": { "External id": 21951,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651677695.226, "dur": 35517.092, "args": { "External id": 21952,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651713358.743, "dur": 8.651, "args": { "External id": 21953,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651713361.434, "dur": 5.647, "args": { "External id": 21954,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4545 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651713393.074, "dur": 376.950, "args": { "External id": 21955,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4546 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651713423.160, "dur": 342.400, "args": { "External id": 21956,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4547, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651713433.948, "dur": 326.384, "args": { "External id": 21957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4548 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651713790.859, "dur": 2.248, "args": { "External id": 21958,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4549, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713848.266, "dur": 6.700, "args": { "External id": 21959,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713898.450, "dur": 1.339, "args": { "External id": 21960,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713914.962, "dur": 1.450, "args": { "External id": 21961,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713927.505, "dur": 1.072, "args": { "External id": 21962,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713942.034, "dur": 0.920, "args": { "External id": 21963,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713953.273, "dur": 0.968, "args": { "External id": 21964,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713964.502, "dur": 0.955, "args": { "External id": 21965,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651713975.750, "dur": 0.971, "args": { "External id": 21966,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714027.619, "dur": 3.386, "args": { "External id": 21967,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4558 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651714128.231, "dur": 2619.213, "args": { "External id": 21968,"Record function id": 0, "Ev Idx": 4559 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651714147.353, "dur": 999.008, "args": { "External id": 21969,"Record function id": 0, "Ev Idx": 4560 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651714162.585, "dur": 329.085, "args": { "External id": 21970,"Record function id": 0, "Ev Idx": 4561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714261.159, "dur": 5.076, "args": { "External id": 21971,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714269.970, "dur": 0.950, "args": { "External id": 21972,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714272.772, "dur": 1.116, "args": { "External id": 21973,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714275.674, "dur": 0.973, "args": { "External id": 21974,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714279.642, "dur": 1.087, "args": { "External id": 21975,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714282.195, "dur": 0.972, "args": { "External id": 21976,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714284.582, "dur": 1.165, "args": { "External id": 21977,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714287.069, "dur": 0.746, "args": { "External id": 21978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714290.456, "dur": 1.132, "args": { "External id": 21979,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651714292.659, "dur": 0.569, "args": { "External id": 21980,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4571 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651714312.178, "dur": 145.934, "args": { "External id": 21981,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651714327.719, "dur": 125.790, "args": { "External id": 21982,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651714343.990, "dur": 13.024, "args": { "External id": 21983,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651714360.525, "dur": 67.937, "args": { "External id": 21984,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651714363.083, "dur": 65.072, "args": { "External id": 21985,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714366.753, "dur": 5.510, "args": { "External id": 21986,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651714373.951, "dur": 53.506, "args": { "External id": 21987,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4578 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.6", "pid": 1336759, "tid": 1381173, "ts": 1295651714571.323, "dur": 567.918, "args": { "External id": 21988,"Record function id": 0, "Ev Idx": 4579 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651714587.134, "dur": 539.820, "args": { "External id": 21989,"Record function id": 0, "Ev Idx": 4580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651714641.188, "dur": 4.531, "args": { "External id": 21990,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651714661.320, "dur": 20.819, "args": { "External id": 21991,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714665.903, "dur": 1.804, "args": { "External id": 21992,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714669.425, "dur": 0.567, "args": { "External id": 21993,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714670.961, "dur": 0.505, "args": { "External id": 21994,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714672.359, "dur": 0.299, "args": { "External id": 21995,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714673.450, "dur": 0.364, "args": { "External id": 21996,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714675.032, "dur": 0.397, "args": { "External id": 21997,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714676.396, "dur": 0.263, "args": { "External id": 21998,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714677.514, "dur": 0.619, "args": { "External id": 21999,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714679.052, "dur": 0.166, "args": { "External id": 22000,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651714690.717, "dur": 26.667, "args": { "External id": 22001,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4592 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651714744.894, "dur": 101.409, "args": { "External id": 22002,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651714753.590, "dur": 2.867, "args": { "External id": 22003,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651714761.094, "dur": 9.795, "args": { "External id": 22004,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651714765.240, "dur": 5.240, "args": { "External id": 22005,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714768.568, "dur": 0.588, "args": { "External id": 22006,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651714776.989, "dur": 19.490, "args": { "External id": 22007,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714778.568, "dur": 0.480, "args": { "External id": 22008,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714780.054, "dur": 0.195, "args": { "External id": 22009,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714781.227, "dur": 0.539, "args": { "External id": 22010,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714783.158, "dur": 0.400, "args": { "External id": 22011,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714784.663, "dur": 0.450, "args": { "External id": 22012,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714786.440, "dur": 0.711, "args": { "External id": 22013,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714788.471, "dur": 0.643, "args": { "External id": 22014,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714789.653, "dur": 0.364, "args": { "External id": 22015,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651714791.453, "dur": 0.484, "args": { "External id": 22016,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651714821.225, "dur": 17.076, "args": { "External id": 22017,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651714888.928, "dur": 160.689, "args": { "External id": 22018,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651714916.832, "dur": 128.687, "args": { "External id": 22019,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4610, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651714926.138, "dur": 114.792, "args": { "External id": 22020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651715068.294, "dur": 1.866, "args": { "External id": 22021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4612, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651715154.107, "dur": 1571.489, "args": { "External id": 22022,"Sequence number": 246556, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4613 } }, { "ph": "f", "id": 212, "pid": 1336759, "tid": 1381173, "ts": 1295651715154.107, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715285.745, "dur": 106.834, "args": { "External id": 22023,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651715431.629, "dur": 37.697, "args": { "External id": 22024,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651715484.529, "dur": 46.718, "args": { "External id": 22025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715540.630, "dur": 31.272, "args": { "External id": 22026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715581.795, "dur": 44.223, "args": { "External id": 22027,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715632.883, "dur": 27.080, "args": { "External id": 22028,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715666.521, "dur": 41.580, "args": { "External id": 22029,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4620 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651715733.024, "dur": 20.184, "args": { "External id": 22030,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4621 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651715771.258, "dur": 26.052, "args": { "External id": 22031,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4622 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651715817.688, "dur": 17.554, "args": { "External id": 22032,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651715848.434, "dur": 13.289, "args": { "External id": 22033,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715869.892, "dur": 26.904, "args": { "External id": 22034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651715899.980, "dur": 31.682, "args": { "External id": 22035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4626 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651715956.138, "dur": 225.448, "args": { "External id": 22036,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651716088.061, "dur": 7.492, "args": { "External id": 22037,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651716097.566, "dur": 2.060, "args": { "External id": 22038,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4629 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651716212.679, "dur": 41.777, "args": { "External id": 22039,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4630 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651716267.543, "dur": 15.443, "args": { "External id": 22040,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716292.531, "dur": 43.122, "args": { "External id": 22041,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716341.571, "dur": 37.815, "args": { "External id": 22042,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716386.152, "dur": 19.757, "args": { "External id": 22043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716409.948, "dur": 32.167, "args": { "External id": 22044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716447.385, "dur": 19.331, "args": { "External id": 22045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651716472.737, "dur": 28.422, "args": { "External id": 22046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4637 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651716520.728, "dur": 21.142, "args": { "External id": 22047,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4638 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651716558.276, "dur": 37.919, "args": { "External id": 22048,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651716619.473, "dur": 19.540, "args": { "External id": 22049,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651716653.901, "dur": 14.196, "args": { "External id": 22050,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651716680.864, "dur": 17.282, "args": { "External id": 22051,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4642 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716769.645, "dur": 14.100, "args": { "External id": 22052,"Record function id": 0, "Ev Idx": 4643 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716772.625, "dur": 10.089, "args": { "External id": 22053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716776.510, "dur": 5.349, "args": { "External id": 22054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4645 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716777.717, "dur": 4.044, "args": { "External id": 22055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4646 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716787.543, "dur": 4.463, "args": { "External id": 22056,"Record function id": 0, "Ev Idx": 4647 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716788.709, "dur": 2.876, "args": { "External id": 22057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716789.574, "dur": 1.550, "args": { "External id": 22058,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4649 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716790.201, "dur": 0.852, "args": { "External id": 22059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4650 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716795.239, "dur": 3.608, "args": { "External id": 22060,"Record function id": 0, "Ev Idx": 4651 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716796.187, "dur": 2.242, "args": { "External id": 22061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716796.651, "dur": 1.348, "args": { "External id": 22062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4653 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716797.258, "dur": 0.645, "args": { "External id": 22063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4654 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716801.995, "dur": 3.630, "args": { "External id": 22064,"Record function id": 0, "Ev Idx": 4655 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716802.922, "dur": 2.288, "args": { "External id": 22065,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716803.456, "dur": 1.306, "args": { "External id": 22066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4657 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716803.975, "dur": 0.683, "args": { "External id": 22067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4658 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716808.639, "dur": 3.600, "args": { "External id": 22068,"Record function id": 0, "Ev Idx": 4659 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716809.673, "dur": 2.116, "args": { "External id": 22069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716810.211, "dur": 1.130, "args": { "External id": 22070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4661 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716810.464, "dur": 0.811, "args": { "External id": 22071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716815.248, "dur": 6.580, "args": { "External id": 22072,"Record function id": 0, "Ev Idx": 4663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716816.223, "dur": 5.201, "args": { "External id": 22073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716816.691, "dur": 4.297, "args": { "External id": 22074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716817.174, "dur": 3.744, "args": { "External id": 22075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716824.925, "dur": 5.094, "args": { "External id": 22076,"Record function id": 0, "Ev Idx": 4667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716825.809, "dur": 3.773, "args": { "External id": 22077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716826.311, "dur": 2.842, "args": { "External id": 22078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716828.439, "dur": 0.621, "args": { "External id": 22079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716832.989, "dur": 3.176, "args": { "External id": 22080,"Record function id": 0, "Ev Idx": 4671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716833.957, "dur": 1.806, "args": { "External id": 22081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716834.435, "dur": 0.869, "args": { "External id": 22082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716834.704, "dur": 0.519, "args": { "External id": 22083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716839.085, "dur": 3.395, "args": { "External id": 22084,"Record function id": 0, "Ev Idx": 4675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651716839.951, "dur": 2.116, "args": { "External id": 22085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716840.524, "dur": 1.104, "args": { "External id": 22086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651716840.974, "dur": 0.589, "args": { "External id": 22087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651716846.147, "dur": 35860.722, "args": { "External id": 22088,"Record function id": 0, "Sequence number": 246555, "Fwd thread id": 1, "Ev Idx": 4679 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651716847.356, "dur": 35851.351, "args": { "External id": 22089,"Sequence number": 246555, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4680 } }, { "ph": "f", "id": 213, "pid": 1336759, "tid": 1381173, "ts": 1295651716847.356, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651716874.393, "dur": 39.764, "args": { "External id": 22090,"Record function id": 0, "Ev Idx": 4681 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651716921.297, "dur": 101.018, "args": { "External id": 22091,"Record function id": 0, "Ev Idx": 4682 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.7)", "pid": 1336759, "tid": 1381173, "ts": 1295651717031.712, "dur": 35659.286, "args": { "External id": 22092,"Record function id": 0, "Ev Idx": 4683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651717127.387, "dur": 7.082, "args": { "External id": 22093,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651717145.184, "dur": 5.135, "args": { "External id": 22094,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4685 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651717167.904, "dur": 34694.366, "args": { "External id": 22095,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651717180.565, "dur": 34669.940, "args": { "External id": 22096,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651717245.395, "dur": 15.328, "args": { "External id": 22097,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651717267.467, "dur": 34546.225, "args": { "External id": 22098,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651717270.327, "dur": 34542.693, "args": { "External id": 22099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651717274.000, "dur": 6.086, "args": { "External id": 22100,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651717283.831, "dur": 34525.794, "args": { "External id": 22101,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651751952.499, "dur": 9.477, "args": { "External id": 22102,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651751955.244, "dur": 6.355, "args": { "External id": 22103,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4694 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651752013.198, "dur": 401.867, "args": { "External id": 22104,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4695 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651752044.021, "dur": 366.021, "args": { "External id": 22105,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4696, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651752055.301, "dur": 349.006, "args": { "External id": 22106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4697 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651752436.112, "dur": 2.002, "args": { "External id": 22107,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4698, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752499.831, "dur": 6.800, "args": { "External id": 22108,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752550.990, "dur": 1.440, "args": { "External id": 22109,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752566.905, "dur": 1.253, "args": { "External id": 22110,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752579.195, "dur": 1.123, "args": { "External id": 22111,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752590.302, "dur": 1.061, "args": { "External id": 22112,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752599.950, "dur": 0.789, "args": { "External id": 22113,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752609.999, "dur": 0.885, "args": { "External id": 22114,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752622.488, "dur": 1.399, "args": { "External id": 22115,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752632.068, "dur": 0.781, "args": { "External id": 22116,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651752721.151, "dur": 2635.814, "args": { "External id": 22117,"Record function id": 0, "Ev Idx": 4708 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651752739.245, "dur": 997.948, "args": { "External id": 22118,"Record function id": 0, "Ev Idx": 4709 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651752754.391, "dur": 355.812, "args": { "External id": 22119,"Record function id": 0, "Ev Idx": 4710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752823.343, "dur": 4.548, "args": { "External id": 22120,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752831.050, "dur": 1.793, "args": { "External id": 22121,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752834.623, "dur": 0.860, "args": { "External id": 22122,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752838.245, "dur": 1.238, "args": { "External id": 22123,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752841.189, "dur": 1.044, "args": { "External id": 22124,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752843.717, "dur": 0.574, "args": { "External id": 22125,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752845.628, "dur": 0.941, "args": { "External id": 22126,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752849.179, "dur": 1.098, "args": { "External id": 22127,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752851.382, "dur": 1.435, "args": { "External id": 22128,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651752854.007, "dur": 0.933, "args": { "External id": 22129,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4720 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651752872.190, "dur": 204.704, "args": { "External id": 22130,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651752887.613, "dur": 184.260, "args": { "External id": 22131,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651752913.832, "dur": 12.569, "args": { "External id": 22132,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651752929.543, "dur": 108.723, "args": { "External id": 22133,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651752932.108, "dur": 105.852, "args": { "External id": 22134,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651752937.989, "dur": 5.383, "args": { "External id": 22135,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651752945.285, "dur": 91.517, "args": { "External id": 22136,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.5", "pid": 1336759, "tid": 1381173, "ts": 1295651753193.036, "dur": 536.203, "args": { "External id": 22137,"Record function id": 0, "Ev Idx": 4728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651753209.828, "dur": 505.121, "args": { "External id": 22138,"Record function id": 0, "Ev Idx": 4729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651753284.049, "dur": 6.483, "args": { "External id": 22139,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651753306.999, "dur": 22.429, "args": { "External id": 22140,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753312.003, "dur": 1.522, "args": { "External id": 22141,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753315.280, "dur": 0.484, "args": { "External id": 22142,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753317.754, "dur": 0.872, "args": { "External id": 22143,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753319.476, "dur": 0.253, "args": { "External id": 22144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753320.579, "dur": 0.696, "args": { "External id": 22145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753321.891, "dur": 0.285, "args": { "External id": 22146,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753322.789, "dur": 0.421, "args": { "External id": 22147,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753324.209, "dur": 0.746, "args": { "External id": 22148,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753325.858, "dur": 0.398, "args": { "External id": 22149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651753339.115, "dur": 30.498, "args": { "External id": 22150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651753399.846, "dur": 97.444, "args": { "External id": 22151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651753409.746, "dur": 3.120, "args": { "External id": 22152,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651753417.830, "dur": 9.604, "args": { "External id": 22153,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651753422.008, "dur": 5.020, "args": { "External id": 22154,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753425.195, "dur": 0.602, "args": { "External id": 22155,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651753433.741, "dur": 20.956, "args": { "External id": 22156,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753435.113, "dur": 0.349, "args": { "External id": 22157,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753436.821, "dur": 0.581, "args": { "External id": 22158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753441.449, "dur": 0.388, "args": { "External id": 22159,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753442.752, "dur": 0.675, "args": { "External id": 22160,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753444.416, "dur": 0.890, "args": { "External id": 22161,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753446.252, "dur": 0.452, "args": { "External id": 22162,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753447.252, "dur": 0.170, "args": { "External id": 22163,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753448.892, "dur": 0.400, "args": { "External id": 22164,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651753450.050, "dur": 0.338, "args": { "External id": 22165,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651753469.354, "dur": 20.585, "args": { "External id": 22166,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651753540.534, "dur": 109.606, "args": { "External id": 22167,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651753565.968, "dur": 80.683, "args": { "External id": 22168,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4759, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651753575.457, "dur": 67.347, "args": { "External id": 22169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651753666.076, "dur": 1.601, "args": { "External id": 22170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4761, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651753743.419, "dur": 1594.739, "args": { "External id": 22171,"Sequence number": 246554, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4762 } }, { "ph": "f", "id": 214, "pid": 1336759, "tid": 1381173, "ts": 1295651753743.419, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651753852.299, "dur": 109.080, "args": { "External id": 22172,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4763 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651754041.521, "dur": 40.068, "args": { "External id": 22173,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651754100.243, "dur": 55.714, "args": { "External id": 22174,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754166.212, "dur": 33.055, "args": { "External id": 22175,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754205.977, "dur": 55.399, "args": { "External id": 22176,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754271.860, "dur": 30.276, "args": { "External id": 22177,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754309.588, "dur": 41.489, "args": { "External id": 22178,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4769 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651754377.522, "dur": 22.607, "args": { "External id": 22179,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4770 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651754417.500, "dur": 25.580, "args": { "External id": 22180,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4771 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651754463.061, "dur": 18.003, "args": { "External id": 22181,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651754494.154, "dur": 13.527, "args": { "External id": 22182,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754515.569, "dur": 26.887, "args": { "External id": 22183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754545.934, "dur": 30.674, "args": { "External id": 22184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4775 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651754604.724, "dur": 167.225, "args": { "External id": 22185,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651754680.314, "dur": 5.856, "args": { "External id": 22186,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651754691.548, "dur": 1.950, "args": { "External id": 22187,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4778 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651754798.804, "dur": 23.187, "args": { "External id": 22188,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4779 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651754831.603, "dur": 12.898, "args": { "External id": 22189,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754851.947, "dur": 30.757, "args": { "External id": 22190,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754888.104, "dur": 34.281, "args": { "External id": 22191,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754928.331, "dur": 19.773, "args": { "External id": 22192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651754951.780, "dur": 68.418, "args": { "External id": 22193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651755030.882, "dur": 24.642, "args": { "External id": 22194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651755061.830, "dur": 29.166, "args": { "External id": 22195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4786 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651755110.695, "dur": 22.498, "args": { "External id": 22196,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4787 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651755150.598, "dur": 21.926, "args": { "External id": 22197,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4788 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651755188.097, "dur": 29.073, "args": { "External id": 22198,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651755256.181, "dur": 17.177, "args": { "External id": 22199,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4790 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651755288.007, "dur": 15.916, "args": { "External id": 22200,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4791 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755382.466, "dur": 14.939, "args": { "External id": 22201,"Record function id": 0, "Ev Idx": 4792 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755386.011, "dur": 10.453, "args": { "External id": 22202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755390.196, "dur": 5.376, "args": { "External id": 22203,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4794 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755391.374, "dur": 4.066, "args": { "External id": 22204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4795 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755401.232, "dur": 4.412, "args": { "External id": 22205,"Record function id": 0, "Ev Idx": 4796 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755402.731, "dur": 2.512, "args": { "External id": 22206,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755403.475, "dur": 1.256, "args": { "External id": 22207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4798 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755403.898, "dur": 0.766, "args": { "External id": 22208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4799 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755408.827, "dur": 4.363, "args": { "External id": 22209,"Record function id": 0, "Ev Idx": 4800 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755409.821, "dur": 2.955, "args": { "External id": 22210,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755410.423, "dur": 1.869, "args": { "External id": 22211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4802 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755410.836, "dur": 1.342, "args": { "External id": 22212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4803 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755416.363, "dur": 3.788, "args": { "External id": 22213,"Record function id": 0, "Ev Idx": 4804 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755417.630, "dur": 2.097, "args": { "External id": 22214,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755418.124, "dur": 1.182, "args": { "External id": 22215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4806 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755418.464, "dur": 0.736, "args": { "External id": 22216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755423.170, "dur": 6.770, "args": { "External id": 22217,"Record function id": 0, "Ev Idx": 4808 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755424.179, "dur": 5.334, "args": { "External id": 22218,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755424.930, "dur": 1.167, "args": { "External id": 22219,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4810 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755425.417, "dur": 0.606, "args": { "External id": 22220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755433.195, "dur": 3.638, "args": { "External id": 22221,"Record function id": 0, "Ev Idx": 4812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755434.083, "dur": 2.327, "args": { "External id": 22222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755434.763, "dur": 1.213, "args": { "External id": 22223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755435.467, "dur": 0.440, "args": { "External id": 22224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755439.924, "dur": 3.466, "args": { "External id": 22225,"Record function id": 0, "Ev Idx": 4816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755440.891, "dur": 2.082, "args": { "External id": 22226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755441.502, "dur": 1.060, "args": { "External id": 22227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755441.771, "dur": 0.691, "args": { "External id": 22228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755446.408, "dur": 3.752, "args": { "External id": 22229,"Record function id": 0, "Ev Idx": 4820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755447.409, "dur": 2.329, "args": { "External id": 22230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755447.867, "dur": 1.387, "args": { "External id": 22231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755448.116, "dur": 1.036, "args": { "External id": 22232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755453.108, "dur": 5.440, "args": { "External id": 22233,"Record function id": 0, "Ev Idx": 4824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651755454.172, "dur": 3.966, "args": { "External id": 22234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755454.673, "dur": 3.028, "args": { "External id": 22235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651755456.807, "dur": 0.796, "args": { "External id": 22236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651755462.100, "dur": 35684.916, "args": { "External id": 22237,"Record function id": 0, "Sequence number": 246553, "Fwd thread id": 1, "Ev Idx": 4828 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651755463.357, "dur": 35675.007, "args": { "External id": 22238,"Sequence number": 246553, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4829 } }, { "ph": "f", "id": 215, "pid": 1336759, "tid": 1381173, "ts": 1295651755463.357, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651755493.702, "dur": 36.919, "args": { "External id": 22239,"Record function id": 0, "Ev Idx": 4830 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651755537.969, "dur": 68.488, "args": { "External id": 22240,"Record function id": 0, "Ev Idx": 4831 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.6)", "pid": 1336759, "tid": 1381173, "ts": 1295651755611.892, "dur": 35518.175, "args": { "External id": 22241,"Record function id": 0, "Ev Idx": 4832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651755700.915, "dur": 6.496, "args": { "External id": 22242,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651755716.324, "dur": 7.816, "args": { "External id": 22243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4834 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651755738.535, "dur": 34621.259, "args": { "External id": 22244,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651755752.994, "dur": 34597.825, "args": { "External id": 22245,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651755806.060, "dur": 14.398, "args": { "External id": 22246,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651755826.640, "dur": 34488.414, "args": { "External id": 22247,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651755829.315, "dur": 34485.123, "args": { "External id": 22248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651755832.824, "dur": 8.160, "args": { "External id": 22249,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651755842.557, "dur": 34468.416, "args": { "External id": 22250,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651790446.151, "dur": 9.926, "args": { "External id": 22251,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651790448.967, "dur": 6.824, "args": { "External id": 22252,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4843 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651790482.024, "dur": 334.309, "args": { "External id": 22253,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4844 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651790512.348, "dur": 299.374, "args": { "External id": 22254,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4845, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651790523.046, "dur": 283.989, "args": { "External id": 22255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4846 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651790836.872, "dur": 2.038, "args": { "External id": 22256,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4847, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651790893.777, "dur": 6.977, "args": { "External id": 22257,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651790943.874, "dur": 1.206, "args": { "External id": 22258,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651790959.369, "dur": 0.936, "args": { "External id": 22259,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651790970.734, "dur": 1.133, "args": { "External id": 22260,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791019.205, "dur": 1.664, "args": { "External id": 22261,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791035.603, "dur": 0.940, "args": { "External id": 22262,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791046.502, "dur": 0.774, "args": { "External id": 22263,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791056.850, "dur": 1.246, "args": { "External id": 22264,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791067.562, "dur": 0.934, "args": { "External id": 22265,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651791163.210, "dur": 2590.434, "args": { "External id": 22266,"Record function id": 0, "Ev Idx": 4857 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651791182.463, "dur": 969.873, "args": { "External id": 22267,"Record function id": 0, "Ev Idx": 4858 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651791197.535, "dur": 325.364, "args": { "External id": 22268,"Record function id": 0, "Ev Idx": 4859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791291.906, "dur": 4.965, "args": { "External id": 22269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791300.242, "dur": 0.758, "args": { "External id": 22270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791302.496, "dur": 1.135, "args": { "External id": 22271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791306.781, "dur": 1.043, "args": { "External id": 22272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791309.231, "dur": 1.022, "args": { "External id": 22273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791311.542, "dur": 1.346, "args": { "External id": 22274,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791314.435, "dur": 0.647, "args": { "External id": 22275,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791317.744, "dur": 1.430, "args": { "External id": 22276,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791320.809, "dur": 1.025, "args": { "External id": 22277,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651791323.198, "dur": 0.487, "args": { "External id": 22278,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4869 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651791342.535, "dur": 152.123, "args": { "External id": 22279,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651791358.605, "dur": 131.671, "args": { "External id": 22280,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651791379.346, "dur": 12.787, "args": { "External id": 22281,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651791395.289, "dur": 68.830, "args": { "External id": 22282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651791399.449, "dur": 64.375, "args": { "External id": 22283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791402.803, "dur": 5.287, "args": { "External id": 22284,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651791409.873, "dur": 53.314, "args": { "External id": 22285,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4876 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.4", "pid": 1336759, "tid": 1381173, "ts": 1295651791602.214, "dur": 542.413, "args": { "External id": 22286,"Record function id": 0, "Ev Idx": 4877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651791617.194, "dur": 514.974, "args": { "External id": 22287,"Record function id": 0, "Ev Idx": 4878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651791671.155, "dur": 4.906, "args": { "External id": 22288,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651791691.319, "dur": 22.216, "args": { "External id": 22289,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791695.827, "dur": 1.818, "args": { "External id": 22290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791699.384, "dur": 0.449, "args": { "External id": 22291,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791701.013, "dur": 0.340, "args": { "External id": 22292,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791702.291, "dur": 0.338, "args": { "External id": 22293,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791704.080, "dur": 0.391, "args": { "External id": 22294,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791705.184, "dur": 0.459, "args": { "External id": 22295,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791706.359, "dur": 0.321, "args": { "External id": 22296,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791708.086, "dur": 0.798, "args": { "External id": 22297,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791710.084, "dur": 0.700, "args": { "External id": 22298,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651791722.126, "dur": 27.266, "args": { "External id": 22299,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4890 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651791777.888, "dur": 85.316, "args": { "External id": 22300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651791786.601, "dur": 2.892, "args": { "External id": 22301,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651791794.399, "dur": 10.733, "args": { "External id": 22302,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651791798.514, "dur": 6.187, "args": { "External id": 22303,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791802.037, "dur": 0.704, "args": { "External id": 22304,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651791811.421, "dur": 19.102, "args": { "External id": 22305,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791813.058, "dur": 0.715, "args": { "External id": 22306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791815.348, "dur": 0.387, "args": { "External id": 22307,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791816.942, "dur": 0.503, "args": { "External id": 22308,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791818.482, "dur": 0.317, "args": { "External id": 22309,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791819.363, "dur": 0.177, "args": { "External id": 22310,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791820.380, "dur": 0.609, "args": { "External id": 22311,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791822.267, "dur": 0.416, "args": { "External id": 22312,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791823.212, "dur": 0.201, "args": { "External id": 22313,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651791824.105, "dur": 1.164, "args": { "External id": 22314,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651791839.343, "dur": 16.965, "args": { "External id": 22315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651791904.545, "dur": 152.508, "args": { "External id": 22316,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651791928.756, "dur": 124.204, "args": { "External id": 22317,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4908, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651791937.613, "dur": 110.625, "args": { "External id": 22318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651792073.845, "dur": 2.163, "args": { "External id": 22319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4910, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651792158.647, "dur": 1573.471, "args": { "External id": 22320,"Sequence number": 246552, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4911 } }, { "ph": "f", "id": 216, "pid": 1336759, "tid": 1381173, "ts": 1295651792158.647, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792292.124, "dur": 108.056, "args": { "External id": 22321,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4912 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651792438.903, "dur": 40.510, "args": { "External id": 22322,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651792494.315, "dur": 49.912, "args": { "External id": 22323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792553.546, "dur": 31.160, "args": { "External id": 22324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792594.156, "dur": 45.117, "args": { "External id": 22325,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792646.540, "dur": 26.775, "args": { "External id": 22326,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792681.099, "dur": 40.897, "args": { "External id": 22327,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4918 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651792745.307, "dur": 19.760, "args": { "External id": 22328,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4919 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651792782.015, "dur": 26.532, "args": { "External id": 22329,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4920 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651792829.564, "dur": 18.551, "args": { "External id": 22330,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4921 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651792859.115, "dur": 13.625, "args": { "External id": 22331,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792880.222, "dur": 26.757, "args": { "External id": 22332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651792910.147, "dur": 31.204, "args": { "External id": 22333,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4924 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651792966.621, "dur": 210.806, "args": { "External id": 22334,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651793082.625, "dur": 6.686, "args": { "External id": 22335,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651793091.769, "dur": 2.601, "args": { "External id": 22336,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4927 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651793209.855, "dur": 45.561, "args": { "External id": 22337,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4928 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651793272.044, "dur": 15.546, "args": { "External id": 22338,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793298.430, "dur": 42.925, "args": { "External id": 22339,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793347.707, "dur": 35.017, "args": { "External id": 22340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793389.673, "dur": 19.930, "args": { "External id": 22341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793414.020, "dur": 29.016, "args": { "External id": 22342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793449.071, "dur": 18.709, "args": { "External id": 22343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651793473.800, "dur": 29.414, "args": { "External id": 22344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4935 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651793522.383, "dur": 21.561, "args": { "External id": 22345,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4936 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651793563.755, "dur": 22.850, "args": { "External id": 22346,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4937 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651793613.545, "dur": 26.349, "args": { "External id": 22347,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651793658.236, "dur": 12.972, "args": { "External id": 22348,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4939 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651793688.718, "dur": 15.186, "args": { "External id": 22349,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793775.436, "dur": 14.673, "args": { "External id": 22350,"Record function id": 0, "Ev Idx": 4941 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793778.566, "dur": 10.562, "args": { "External id": 22351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793782.601, "dur": 5.770, "args": { "External id": 22352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4943 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793784.015, "dur": 4.262, "args": { "External id": 22353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4944 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793793.979, "dur": 4.271, "args": { "External id": 22354,"Record function id": 0, "Ev Idx": 4945 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793795.160, "dur": 2.630, "args": { "External id": 22355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793795.924, "dur": 1.416, "args": { "External id": 22356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4947 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793796.419, "dur": 0.815, "args": { "External id": 22357,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4948 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793804.273, "dur": 4.575, "args": { "External id": 22358,"Record function id": 0, "Ev Idx": 4949 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793805.374, "dur": 3.020, "args": { "External id": 22359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793806.081, "dur": 1.881, "args": { "External id": 22360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4951 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793806.628, "dur": 1.241, "args": { "External id": 22361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4952 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793811.962, "dur": 3.611, "args": { "External id": 22362,"Record function id": 0, "Ev Idx": 4953 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793813.125, "dur": 1.999, "args": { "External id": 22363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793813.727, "dur": 0.992, "args": { "External id": 22364,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4955 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793814.000, "dur": 0.624, "args": { "External id": 22365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4956 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793818.584, "dur": 3.996, "args": { "External id": 22366,"Record function id": 0, "Ev Idx": 4957 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793819.696, "dur": 2.446, "args": { "External id": 22367,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793820.187, "dur": 1.537, "args": { "External id": 22368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4959 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793820.733, "dur": 0.917, "args": { "External id": 22369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793825.664, "dur": 3.599, "args": { "External id": 22370,"Record function id": 0, "Ev Idx": 4961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793826.670, "dur": 2.139, "args": { "External id": 22371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793827.195, "dur": 1.184, "args": { "External id": 22372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793827.687, "dur": 0.621, "args": { "External id": 22373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793832.402, "dur": 3.227, "args": { "External id": 22374,"Record function id": 0, "Ev Idx": 4965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793833.382, "dur": 1.815, "args": { "External id": 22375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793833.859, "dur": 0.940, "args": { "External id": 22376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793834.128, "dur": 0.596, "args": { "External id": 22377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793838.650, "dur": 3.425, "args": { "External id": 22378,"Record function id": 0, "Ev Idx": 4969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793839.708, "dur": 1.924, "args": { "External id": 22379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793840.196, "dur": 1.034, "args": { "External id": 22380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793840.450, "dur": 0.704, "args": { "External id": 22381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793845.030, "dur": 5.145, "args": { "External id": 22382,"Record function id": 0, "Ev Idx": 4973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651793845.978, "dur": 3.714, "args": { "External id": 22383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793846.515, "dur": 2.761, "args": { "External id": 22384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651793848.375, "dur": 0.826, "args": { "External id": 22385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651793853.801, "dur": 38107.446, "args": { "External id": 22386,"Record function id": 0, "Sequence number": 246551, "Fwd thread id": 1, "Ev Idx": 4977 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651793854.995, "dur": 38097.949, "args": { "External id": 22387,"Sequence number": 246551, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4978 } }, { "ph": "f", "id": 217, "pid": 1336759, "tid": 1381173, "ts": 1295651793854.995, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651793886.336, "dur": 42.830, "args": { "External id": 22388,"Record function id": 0, "Ev Idx": 4979 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651793936.340, "dur": 109.588, "args": { "External id": 22389,"Record function id": 0, "Ev Idx": 4980 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.5)", "pid": 1336759, "tid": 1381173, "ts": 1295651794053.920, "dur": 37891.102, "args": { "External id": 22390,"Record function id": 0, "Ev Idx": 4981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651794147.263, "dur": 10.021, "args": { "External id": 22391,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651794167.170, "dur": 5.446, "args": { "External id": 22392,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4983 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651794187.560, "dur": 36951.482, "args": { "External id": 22393,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651794201.427, "dur": 36928.510, "args": { "External id": 22394,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651794273.475, "dur": 14.945, "args": { "External id": 22395,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651794294.726, "dur": 36799.984, "args": { "External id": 22396,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651794297.110, "dur": 36796.905, "args": { "External id": 22397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651794300.747, "dur": 6.416, "args": { "External id": 22398,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651794308.872, "dur": 36781.553, "args": { "External id": 22399,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651831245.686, "dur": 11.280, "args": { "External id": 22400,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651831249.402, "dur": 7.069, "args": { "External id": 22401,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4992 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651831285.808, "dur": 387.379, "args": { "External id": 22402,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651831314.083, "dur": 354.322, "args": { "External id": 22403,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4994, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651831325.025, "dur": 337.680, "args": { "External id": 22404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4995 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651831693.184, "dur": 2.549, "args": { "External id": 22405,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4996, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831754.618, "dur": 6.458, "args": { "External id": 22406,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831803.815, "dur": 1.220, "args": { "External id": 22407,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831820.355, "dur": 1.224, "args": { "External id": 22408,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831832.324, "dur": 0.954, "args": { "External id": 22409,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831843.830, "dur": 0.930, "args": { "External id": 22410,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831854.186, "dur": 0.760, "args": { "External id": 22411,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831864.123, "dur": 1.140, "args": { "External id": 22412,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831874.948, "dur": 1.228, "args": { "External id": 22413,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651831884.335, "dur": 0.927, "args": { "External id": 22414,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651831975.054, "dur": 2636.101, "args": { "External id": 22415,"Record function id": 0, "Ev Idx": 5006 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651832034.815, "dur": 923.887, "args": { "External id": 22416,"Record function id": 0, "Ev Idx": 5007 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651832050.538, "dur": 324.261, "args": { "External id": 22417,"Record function id": 0, "Ev Idx": 5008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832127.222, "dur": 4.820, "args": { "External id": 22418,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832135.097, "dur": 0.982, "args": { "External id": 22419,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832139.228, "dur": 1.502, "args": { "External id": 22420,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832142.123, "dur": 0.958, "args": { "External id": 22421,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832144.381, "dur": 0.518, "args": { "External id": 22422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832146.079, "dur": 1.148, "args": { "External id": 22423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832149.769, "dur": 0.710, "args": { "External id": 22424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832151.674, "dur": 0.960, "args": { "External id": 22425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832153.885, "dur": 0.981, "args": { "External id": 22426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651832156.135, "dur": 0.431, "args": { "External id": 22427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5018 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651832175.819, "dur": 166.551, "args": { "External id": 22428,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651832191.902, "dur": 145.273, "args": { "External id": 22429,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651832212.441, "dur": 12.571, "args": { "External id": 22430,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651832243.062, "dur": 67.676, "args": { "External id": 22431,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651832246.373, "dur": 64.077, "args": { "External id": 22432,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832250.429, "dur": 5.919, "args": { "External id": 22433,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651832258.112, "dur": 51.672, "args": { "External id": 22434,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5025 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.3", "pid": 1336759, "tid": 1381173, "ts": 1295651832455.145, "dur": 496.318, "args": { "External id": 22435,"Record function id": 0, "Ev Idx": 5026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651832471.058, "dur": 468.613, "args": { "External id": 22436,"Record function id": 0, "Ev Idx": 5027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651832526.712, "dur": 4.764, "args": { "External id": 22437,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651832547.505, "dur": 23.471, "args": { "External id": 22438,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832552.412, "dur": 1.782, "args": { "External id": 22439,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832555.964, "dur": 0.414, "args": { "External id": 22440,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832557.470, "dur": 0.406, "args": { "External id": 22441,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832559.314, "dur": 0.543, "args": { "External id": 22442,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832561.142, "dur": 0.285, "args": { "External id": 22443,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832562.438, "dur": 0.406, "args": { "External id": 22444,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832563.610, "dur": 0.748, "args": { "External id": 22445,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832565.784, "dur": 0.310, "args": { "External id": 22446,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832566.922, "dur": 0.526, "args": { "External id": 22447,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651832579.643, "dur": 27.463, "args": { "External id": 22448,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5039 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651832636.058, "dur": 81.629, "args": { "External id": 22449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651832645.629, "dur": 3.010, "args": { "External id": 22450,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651832653.350, "dur": 9.916, "args": { "External id": 22451,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651832657.482, "dur": 5.367, "args": { "External id": 22452,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832660.758, "dur": 0.818, "args": { "External id": 22453,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651832669.599, "dur": 16.890, "args": { "External id": 22454,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832670.826, "dur": 0.469, "args": { "External id": 22455,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832672.338, "dur": 0.384, "args": { "External id": 22456,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832673.613, "dur": 0.571, "args": { "External id": 22457,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832675.253, "dur": 0.164, "args": { "External id": 22458,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832675.987, "dur": 0.199, "args": { "External id": 22459,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832676.731, "dur": 0.618, "args": { "External id": 22460,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832679.161, "dur": 0.415, "args": { "External id": 22461,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832680.388, "dur": 0.302, "args": { "External id": 22462,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651832681.211, "dur": 0.254, "args": { "External id": 22463,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651832694.488, "dur": 16.444, "args": { "External id": 22464,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651832759.514, "dur": 113.475, "args": { "External id": 22465,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651832784.936, "dur": 84.475, "args": { "External id": 22466,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5057, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651832794.514, "dur": 70.638, "args": { "External id": 22467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651832891.901, "dur": 1.728, "args": { "External id": 22468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5059, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651832965.844, "dur": 1623.511, "args": { "External id": 22469,"Sequence number": 246550, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5060 } }, { "ph": "f", "id": 218, "pid": 1336759, "tid": 1381173, "ts": 1295651832965.844, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833117.367, "dur": 108.799, "args": { "External id": 22470,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651833288.254, "dur": 38.292, "args": { "External id": 22471,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651833346.866, "dur": 54.242, "args": { "External id": 22472,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833410.409, "dur": 31.677, "args": { "External id": 22473,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833448.705, "dur": 44.879, "args": { "External id": 22474,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833500.344, "dur": 26.545, "args": { "External id": 22475,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833533.293, "dur": 43.140, "args": { "External id": 22476,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5067 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651833598.247, "dur": 20.811, "args": { "External id": 22477,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5068 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651833639.351, "dur": 25.775, "args": { "External id": 22478,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5069 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651833687.163, "dur": 18.002, "args": { "External id": 22479,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5070 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651833721.856, "dur": 13.575, "args": { "External id": 22480,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833743.154, "dur": 30.348, "args": { "External id": 22481,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651833776.737, "dur": 30.892, "args": { "External id": 22482,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5073 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651833833.052, "dur": 203.215, "args": { "External id": 22483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651833905.965, "dur": 6.335, "args": { "External id": 22484,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651833914.328, "dur": 2.693, "args": { "External id": 22485,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5076 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651834069.901, "dur": 27.151, "args": { "External id": 22486,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5077 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651834108.616, "dur": 13.789, "args": { "External id": 22487,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834131.401, "dur": 38.283, "args": { "External id": 22488,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834175.642, "dur": 33.815, "args": { "External id": 22489,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834215.908, "dur": 35.920, "args": { "External id": 22490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834259.192, "dur": 32.221, "args": { "External id": 22491,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834298.270, "dur": 19.864, "args": { "External id": 22492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651834324.025, "dur": 29.922, "args": { "External id": 22493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5084 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651834374.842, "dur": 23.278, "args": { "External id": 22494,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5085 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651834413.517, "dur": 25.138, "args": { "External id": 22495,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651834456.973, "dur": 34.228, "args": { "External id": 22496,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651834514.155, "dur": 13.929, "args": { "External id": 22497,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651834544.116, "dur": 15.488, "args": { "External id": 22498,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5089 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834633.887, "dur": 14.390, "args": { "External id": 22499,"Record function id": 0, "Ev Idx": 5090 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834636.811, "dur": 10.408, "args": { "External id": 22500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834640.835, "dur": 5.559, "args": { "External id": 22501,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5092 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834642.152, "dur": 4.115, "args": { "External id": 22502,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5093 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834652.216, "dur": 7.645, "args": { "External id": 22503,"Record function id": 0, "Ev Idx": 5094 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834653.634, "dur": 5.792, "args": { "External id": 22504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834657.645, "dur": 1.362, "args": { "External id": 22505,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5096 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834658.080, "dur": 0.859, "args": { "External id": 22506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834663.208, "dur": 3.820, "args": { "External id": 22507,"Record function id": 0, "Ev Idx": 5098 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834664.166, "dur": 2.403, "args": { "External id": 22508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834664.741, "dur": 1.410, "args": { "External id": 22509,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5100 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834665.224, "dur": 0.827, "args": { "External id": 22510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834670.197, "dur": 3.659, "args": { "External id": 22511,"Record function id": 0, "Ev Idx": 5102 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834671.270, "dur": 2.174, "args": { "External id": 22512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834671.842, "dur": 1.172, "args": { "External id": 22513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5104 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834672.110, "dur": 0.801, "args": { "External id": 22514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5105 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834676.868, "dur": 3.799, "args": { "External id": 22515,"Record function id": 0, "Ev Idx": 5106 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834677.957, "dur": 2.273, "args": { "External id": 22516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834678.449, "dur": 1.317, "args": { "External id": 22517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5108 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834678.758, "dur": 0.933, "args": { "External id": 22518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834683.742, "dur": 3.546, "args": { "External id": 22519,"Record function id": 0, "Ev Idx": 5110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834684.796, "dur": 2.032, "args": { "External id": 22520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834685.261, "dur": 1.132, "args": { "External id": 22521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834685.668, "dur": 0.655, "args": { "External id": 22522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834690.340, "dur": 3.348, "args": { "External id": 22523,"Record function id": 0, "Ev Idx": 5114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834691.243, "dur": 2.034, "args": { "External id": 22524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834691.700, "dur": 1.173, "args": { "External id": 22525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834691.953, "dur": 0.846, "args": { "External id": 22526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834696.714, "dur": 39.364, "args": { "External id": 22527,"Record function id": 0, "Ev Idx": 5118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834697.643, "dur": 37.987, "args": { "External id": 22528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834731.146, "dur": 4.034, "args": { "External id": 22529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834733.407, "dur": 1.664, "args": { "External id": 22530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834739.154, "dur": 3.398, "args": { "External id": 22531,"Record function id": 0, "Ev Idx": 5122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651834740.314, "dur": 1.826, "args": { "External id": 22532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834740.841, "dur": 0.907, "args": { "External id": 22533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651834741.101, "dur": 0.559, "args": { "External id": 22534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651834745.836, "dur": 36315.600, "args": { "External id": 22535,"Record function id": 0, "Sequence number": 246549, "Fwd thread id": 1, "Ev Idx": 5126 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651834747.014, "dur": 36304.801, "args": { "External id": 22536,"Sequence number": 246549, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5127 } }, { "ph": "f", "id": 219, "pid": 1336759, "tid": 1381173, "ts": 1295651834747.014, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651834775.886, "dur": 40.208, "args": { "External id": 22537,"Record function id": 0, "Ev Idx": 5128 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651834823.895, "dur": 62.271, "args": { "External id": 22538,"Record function id": 0, "Ev Idx": 5129 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.4)", "pid": 1336759, "tid": 1381173, "ts": 1295651834891.343, "dur": 36151.795, "args": { "External id": 22539,"Record function id": 0, "Ev Idx": 5130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651834979.792, "dur": 50.844, "args": { "External id": 22540,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651835044.305, "dur": 5.477, "args": { "External id": 22541,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651835066.663, "dur": 35213.992, "args": { "External id": 22542,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651835080.204, "dur": 35191.263, "args": { "External id": 22543,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651835129.121, "dur": 14.522, "args": { "External id": 22544,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651835150.039, "dur": 35069.806, "args": { "External id": 22545,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651835152.572, "dur": 35066.598, "args": { "External id": 22546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651835156.203, "dur": 5.234, "args": { "External id": 22547,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651835163.017, "dur": 35052.920, "args": { "External id": 22548,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651870367.525, "dur": 9.812, "args": { "External id": 22549,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651870370.243, "dur": 6.714, "args": { "External id": 22550,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5141 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651870404.125, "dur": 331.578, "args": { "External id": 22551,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5142 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651870432.472, "dur": 298.807, "args": { "External id": 22552,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5143, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651870443.498, "dur": 282.582, "args": { "External id": 22553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5144 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651870753.498, "dur": 1.840, "args": { "External id": 22554,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5145, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870807.261, "dur": 6.437, "args": { "External id": 22555,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870857.119, "dur": 2.070, "args": { "External id": 22556,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870873.738, "dur": 1.009, "args": { "External id": 22557,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870885.595, "dur": 1.134, "args": { "External id": 22558,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870897.097, "dur": 1.219, "args": { "External id": 22559,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870907.282, "dur": 1.069, "args": { "External id": 22560,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870919.350, "dur": 0.738, "args": { "External id": 22561,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870930.609, "dur": 0.888, "args": { "External id": 22562,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651870943.900, "dur": 0.960, "args": { "External id": 22563,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651871078.114, "dur": 2594.834, "args": { "External id": 22564,"Record function id": 0, "Ev Idx": 5155 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651871096.981, "dur": 986.038, "args": { "External id": 22565,"Record function id": 0, "Ev Idx": 5156 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651871112.645, "dur": 331.017, "args": { "External id": 22566,"Record function id": 0, "Ev Idx": 5157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871188.587, "dur": 4.536, "args": { "External id": 22567,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871196.119, "dur": 0.986, "args": { "External id": 22568,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871200.949, "dur": 1.106, "args": { "External id": 22569,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871203.588, "dur": 1.005, "args": { "External id": 22570,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871206.051, "dur": 1.329, "args": { "External id": 22571,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871208.796, "dur": 1.140, "args": { "External id": 22572,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871213.362, "dur": 0.787, "args": { "External id": 22573,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871215.375, "dur": 1.037, "args": { "External id": 22574,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871217.708, "dur": 1.471, "args": { "External id": 22575,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651871220.546, "dur": 0.553, "args": { "External id": 22576,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5167 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651871258.463, "dur": 151.768, "args": { "External id": 22577,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651871274.980, "dur": 130.409, "args": { "External id": 22578,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651871297.824, "dur": 12.753, "args": { "External id": 22579,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651871313.823, "dur": 65.018, "args": { "External id": 22580,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651871316.490, "dur": 62.028, "args": { "External id": 22581,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871320.117, "dur": 5.521, "args": { "External id": 22582,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651871327.268, "dur": 50.640, "args": { "External id": 22583,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5174 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.2", "pid": 1336759, "tid": 1381173, "ts": 1295651871525.550, "dur": 549.501, "args": { "External id": 22584,"Record function id": 0, "Ev Idx": 5175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651871542.015, "dur": 516.931, "args": { "External id": 22585,"Record function id": 0, "Ev Idx": 5176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651871597.000, "dur": 4.522, "args": { "External id": 22586,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651871616.476, "dur": 22.351, "args": { "External id": 22587,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871621.006, "dur": 1.537, "args": { "External id": 22588,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871624.643, "dur": 0.774, "args": { "External id": 22589,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871626.684, "dur": 0.622, "args": { "External id": 22590,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871629.176, "dur": 0.312, "args": { "External id": 22591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871630.385, "dur": 0.277, "args": { "External id": 22592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871631.377, "dur": 0.173, "args": { "External id": 22593,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871632.503, "dur": 0.623, "args": { "External id": 22594,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871634.189, "dur": 0.648, "args": { "External id": 22595,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871635.425, "dur": 0.256, "args": { "External id": 22596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651871647.619, "dur": 28.313, "args": { "External id": 22597,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651871704.548, "dur": 84.783, "args": { "External id": 22598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651871713.158, "dur": 3.022, "args": { "External id": 22599,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651871720.636, "dur": 9.961, "args": { "External id": 22600,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651871724.770, "dur": 5.423, "args": { "External id": 22601,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871727.834, "dur": 0.973, "args": { "External id": 22602,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651871736.550, "dur": 20.785, "args": { "External id": 22603,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871738.128, "dur": 0.448, "args": { "External id": 22604,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871739.464, "dur": 0.221, "args": { "External id": 22605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871741.550, "dur": 0.473, "args": { "External id": 22606,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871743.109, "dur": 0.283, "args": { "External id": 22607,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871743.943, "dur": 0.182, "args": { "External id": 22608,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871744.845, "dur": 0.500, "args": { "External id": 22609,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871746.707, "dur": 0.589, "args": { "External id": 22610,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871747.970, "dur": 0.414, "args": { "External id": 22611,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651871748.978, "dur": 0.298, "args": { "External id": 22612,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651871765.041, "dur": 17.175, "args": { "External id": 22613,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651871832.775, "dur": 110.817, "args": { "External id": 22614,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651871856.726, "dur": 83.497, "args": { "External id": 22615,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5206, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651871867.287, "dur": 69.106, "args": { "External id": 22616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651871963.076, "dur": 1.833, "args": { "External id": 22617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5208, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651872090.397, "dur": 1565.084, "args": { "External id": 22618,"Sequence number": 246548, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5209 } }, { "ph": "f", "id": 220, "pid": 1336759, "tid": 1381173, "ts": 1295651872090.397, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872203.577, "dur": 124.293, "args": { "External id": 22619,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5210 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651872372.433, "dur": 37.983, "args": { "External id": 22620,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651872426.021, "dur": 48.273, "args": { "External id": 22621,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872483.161, "dur": 31.785, "args": { "External id": 22622,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872521.562, "dur": 44.264, "args": { "External id": 22623,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872573.067, "dur": 27.901, "args": { "External id": 22624,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872608.634, "dur": 41.437, "args": { "External id": 22625,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5216 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651872671.927, "dur": 20.469, "args": { "External id": 22626,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5217 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651872712.340, "dur": 26.191, "args": { "External id": 22627,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5218 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651872762.025, "dur": 17.431, "args": { "External id": 22628,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651872790.099, "dur": 13.356, "args": { "External id": 22629,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872811.341, "dur": 26.892, "args": { "External id": 22630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651872841.594, "dur": 30.843, "args": { "External id": 22631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5222 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651872897.439, "dur": 207.767, "args": { "External id": 22632,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651872970.665, "dur": 5.965, "args": { "External id": 22633,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651872978.510, "dur": 1.932, "args": { "External id": 22634,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5225 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651873140.166, "dur": 26.548, "args": { "External id": 22635,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5226 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651873177.402, "dur": 12.932, "args": { "External id": 22636,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873198.705, "dur": 58.339, "args": { "External id": 22637,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873265.550, "dur": 37.361, "args": { "External id": 22638,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873310.081, "dur": 20.326, "args": { "External id": 22639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873334.860, "dur": 28.798, "args": { "External id": 22640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873369.577, "dur": 22.680, "args": { "External id": 22641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651873398.823, "dur": 28.480, "args": { "External id": 22642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5233 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651873450.294, "dur": 21.973, "args": { "External id": 22643,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5234 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651873488.544, "dur": 21.451, "args": { "External id": 22644,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5235 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651873541.928, "dur": 22.635, "args": { "External id": 22645,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651873584.284, "dur": 13.265, "args": { "External id": 22646,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5237 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651873610.132, "dur": 14.287, "args": { "External id": 22647,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5238 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873698.502, "dur": 14.325, "args": { "External id": 22648,"Record function id": 0, "Ev Idx": 5239 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873701.504, "dur": 10.328, "args": { "External id": 22649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873705.412, "dur": 5.577, "args": { "External id": 22650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5241 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873706.734, "dur": 4.137, "args": { "External id": 22651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873716.536, "dur": 4.319, "args": { "External id": 22652,"Record function id": 0, "Ev Idx": 5243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873717.803, "dur": 2.595, "args": { "External id": 22653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873718.577, "dur": 1.347, "args": { "External id": 22654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873719.054, "dur": 0.797, "args": { "External id": 22655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873724.044, "dur": 4.259, "args": { "External id": 22656,"Record function id": 0, "Ev Idx": 5247 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873725.151, "dur": 2.673, "args": { "External id": 22657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873725.944, "dur": 1.455, "args": { "External id": 22658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5249 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873726.598, "dur": 0.693, "args": { "External id": 22659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5250 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873731.578, "dur": 3.688, "args": { "External id": 22660,"Record function id": 0, "Ev Idx": 5251 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873732.575, "dur": 2.268, "args": { "External id": 22661,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873733.156, "dur": 1.311, "args": { "External id": 22662,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5253 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873733.781, "dur": 0.569, "args": { "External id": 22663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5254 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873738.353, "dur": 3.517, "args": { "External id": 22664,"Record function id": 0, "Ev Idx": 5255 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873739.307, "dur": 2.125, "args": { "External id": 22665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873740.081, "dur": 0.943, "args": { "External id": 22666,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5257 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873740.416, "dur": 0.543, "args": { "External id": 22667,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873744.845, "dur": 3.887, "args": { "External id": 22668,"Record function id": 0, "Ev Idx": 5259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873745.833, "dur": 2.502, "args": { "External id": 22669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873746.309, "dur": 1.634, "args": { "External id": 22670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873746.761, "dur": 1.114, "args": { "External id": 22671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873751.939, "dur": 6.517, "args": { "External id": 22672,"Record function id": 0, "Ev Idx": 5263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873756.056, "dur": 1.968, "args": { "External id": 22673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873756.689, "dur": 0.950, "args": { "External id": 22674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873756.950, "dur": 0.614, "args": { "External id": 22675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873761.421, "dur": 7.495, "args": { "External id": 22676,"Record function id": 0, "Ev Idx": 5267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873762.424, "dur": 6.042, "args": { "External id": 22677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873765.612, "dur": 2.462, "args": { "External id": 22678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873767.413, "dur": 0.590, "args": { "External id": 22679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873771.996, "dur": 3.226, "args": { "External id": 22680,"Record function id": 0, "Ev Idx": 5271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651873772.945, "dur": 1.815, "args": { "External id": 22681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873773.412, "dur": 0.934, "args": { "External id": 22682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651873773.687, "dur": 0.594, "args": { "External id": 22683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651873778.834, "dur": 36547.649, "args": { "External id": 22684,"Record function id": 0, "Sequence number": 246547, "Fwd thread id": 1, "Ev Idx": 5275 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651873780.274, "dur": 36534.120, "args": { "External id": 22685,"Sequence number": 246547, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5276 } }, { "ph": "f", "id": 221, "pid": 1336759, "tid": 1381173, "ts": 1295651873780.274, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651873806.500, "dur": 39.434, "args": { "External id": 22686,"Record function id": 0, "Ev Idx": 5277 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651873853.270, "dur": 62.521, "args": { "External id": 22687,"Record function id": 0, "Ev Idx": 5278 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.3)", "pid": 1336759, "tid": 1381173, "ts": 1295651873921.104, "dur": 36384.774, "args": { "External id": 22688,"Record function id": 0, "Ev Idx": 5279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651874050.436, "dur": 7.818, "args": { "External id": 22689,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651874069.063, "dur": 5.185, "args": { "External id": 22690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5281 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651874091.385, "dur": 35395.866, "args": { "External id": 22691,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651874105.142, "dur": 35372.748, "args": { "External id": 22692,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651874150.038, "dur": 16.654, "args": { "External id": 22693,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651874172.969, "dur": 35268.303, "args": { "External id": 22694,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651874175.413, "dur": 35265.140, "args": { "External id": 22695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651874179.096, "dur": 6.315, "args": { "External id": 22696,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651874186.947, "dur": 35249.949, "args": { "External id": 22697,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651909578.734, "dur": 9.541, "args": { "External id": 22698,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651909581.785, "dur": 6.208, "args": { "External id": 22699,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5290 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651909617.697, "dur": 334.226, "args": { "External id": 22700,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5291 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651909644.890, "dur": 302.460, "args": { "External id": 22701,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5292, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651909655.693, "dur": 286.272, "args": { "External id": 22702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5293 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651909970.830, "dur": 2.079, "args": { "External id": 22703,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5294, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910083.602, "dur": 6.991, "args": { "External id": 22704,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910139.246, "dur": 1.540, "args": { "External id": 22705,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910155.438, "dur": 1.627, "args": { "External id": 22706,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910167.505, "dur": 0.981, "args": { "External id": 22707,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910179.284, "dur": 0.884, "args": { "External id": 22708,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910189.743, "dur": 0.626, "args": { "External id": 22709,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910200.137, "dur": 0.699, "args": { "External id": 22710,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910214.752, "dur": 1.531, "args": { "External id": 22711,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910225.296, "dur": 0.871, "args": { "External id": 22712,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5303 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651910343.771, "dur": 2609.615, "args": { "External id": 22713,"Record function id": 0, "Ev Idx": 5304 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651910363.253, "dur": 1016.879, "args": { "External id": 22714,"Record function id": 0, "Ev Idx": 5305 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651910382.026, "dur": 304.136, "args": { "External id": 22715,"Record function id": 0, "Ev Idx": 5306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910455.850, "dur": 4.871, "args": { "External id": 22716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910465.364, "dur": 0.864, "args": { "External id": 22717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910467.847, "dur": 0.942, "args": { "External id": 22718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910470.193, "dur": 1.268, "args": { "External id": 22719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910473.101, "dur": 6.519, "args": { "External id": 22720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910482.275, "dur": 0.478, "args": { "External id": 22721,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910484.304, "dur": 1.515, "args": { "External id": 22722,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910487.326, "dur": 0.564, "args": { "External id": 22723,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910489.146, "dur": 0.555, "args": { "External id": 22724,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651910492.392, "dur": 1.606, "args": { "External id": 22725,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5316 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651910512.424, "dur": 146.019, "args": { "External id": 22726,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651910527.806, "dur": 126.457, "args": { "External id": 22727,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651910548.013, "dur": 12.807, "args": { "External id": 22728,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651910563.923, "dur": 65.203, "args": { "External id": 22729,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651910566.872, "dur": 61.873, "args": { "External id": 22730,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910570.774, "dur": 5.381, "args": { "External id": 22731,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651910577.788, "dur": 50.250, "args": { "External id": 22732,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5323 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.1", "pid": 1336759, "tid": 1381173, "ts": 1295651910764.573, "dur": 604.272, "args": { "External id": 22733,"Record function id": 0, "Ev Idx": 5324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651910781.097, "dur": 575.529, "args": { "External id": 22734,"Record function id": 0, "Ev Idx": 5325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651910835.779, "dur": 4.954, "args": { "External id": 22735,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651910863.794, "dur": 19.938, "args": { "External id": 22736,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910869.618, "dur": 1.644, "args": { "External id": 22737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910872.460, "dur": 0.275, "args": { "External id": 22738,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910873.789, "dur": 0.309, "args": { "External id": 22739,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910874.778, "dur": 0.166, "args": { "External id": 22740,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910875.497, "dur": 0.553, "args": { "External id": 22741,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910877.401, "dur": 0.256, "args": { "External id": 22742,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910878.389, "dur": 0.158, "args": { "External id": 22743,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910879.070, "dur": 0.186, "args": { "External id": 22744,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910880.545, "dur": 0.421, "args": { "External id": 22745,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651910892.167, "dur": 30.972, "args": { "External id": 22746,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5337 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651910952.832, "dur": 143.602, "args": { "External id": 22747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651910961.812, "dur": 2.861, "args": { "External id": 22748,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651910972.938, "dur": 47.971, "args": { "External id": 22749,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651910977.068, "dur": 43.294, "args": { "External id": 22750,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651910980.178, "dur": 37.812, "args": { "External id": 22751,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651911031.186, "dur": 23.194, "args": { "External id": 22752,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911033.440, "dur": 0.707, "args": { "External id": 22753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911035.391, "dur": 0.578, "args": { "External id": 22754,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911037.078, "dur": 0.267, "args": { "External id": 22755,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911038.490, "dur": 0.625, "args": { "External id": 22756,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911040.666, "dur": 0.574, "args": { "External id": 22757,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911042.272, "dur": 0.250, "args": { "External id": 22758,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911046.141, "dur": 0.223, "args": { "External id": 22759,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911047.433, "dur": 0.627, "args": { "External id": 22760,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651911049.334, "dur": 0.411, "args": { "External id": 22761,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651911064.164, "dur": 24.269, "args": { "External id": 22762,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651911144.321, "dur": 137.092, "args": { "External id": 22763,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651911170.297, "dur": 107.383, "args": { "External id": 22764,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5355, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651911178.778, "dur": 94.574, "args": { "External id": 22765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651911298.637, "dur": 1.914, "args": { "External id": 22766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5357, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651911386.958, "dur": 1546.437, "args": { "External id": 22767,"Sequence number": 246546, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5358 } }, { "ph": "f", "id": 222, "pid": 1336759, "tid": 1381173, "ts": 1295651911386.958, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651911496.309, "dur": 106.993, "args": { "External id": 22768,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5359 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651911640.256, "dur": 36.140, "args": { "External id": 22769,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651911695.307, "dur": 50.857, "args": { "External id": 22770,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651911755.755, "dur": 31.936, "args": { "External id": 22771,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651911794.712, "dur": 44.210, "args": { "External id": 22772,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651911846.293, "dur": 28.332, "args": { "External id": 22773,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651911881.001, "dur": 43.837, "args": { "External id": 22774,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5365 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651911947.033, "dur": 21.229, "args": { "External id": 22775,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5366 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651912026.966, "dur": 30.945, "args": { "External id": 22776,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5367 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651912080.918, "dur": 19.590, "args": { "External id": 22777,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5368 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651912114.646, "dur": 13.990, "args": { "External id": 22778,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912137.359, "dur": 31.832, "args": { "External id": 22779,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912172.617, "dur": 33.124, "args": { "External id": 22780,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5371 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651912244.980, "dur": 165.651, "args": { "External id": 22781,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651912322.301, "dur": 6.736, "args": { "External id": 22782,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651912331.245, "dur": 2.003, "args": { "External id": 22783,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5374 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651912443.108, "dur": 25.225, "args": { "External id": 22784,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5375 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651912480.445, "dur": 13.208, "args": { "External id": 22785,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912501.741, "dur": 40.388, "args": { "External id": 22786,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912548.608, "dur": 34.985, "args": { "External id": 22787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912589.954, "dur": 19.845, "args": { "External id": 22788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912614.308, "dur": 29.586, "args": { "External id": 22789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912649.611, "dur": 19.445, "args": { "External id": 22790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651912675.103, "dur": 28.475, "args": { "External id": 22791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5382 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651912723.654, "dur": 21.642, "args": { "External id": 22792,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5383 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651912780.982, "dur": 28.286, "args": { "External id": 22793,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5384 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651912826.454, "dur": 20.464, "args": { "External id": 22794,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651912861.832, "dur": 13.389, "args": { "External id": 22795,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5386 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651912888.338, "dur": 17.686, "args": { "External id": 22796,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5387 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651912975.457, "dur": 57.639, "args": { "External id": 22797,"Record function id": 0, "Ev Idx": 5388 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651912978.973, "dur": 52.406, "args": { "External id": 22798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651912983.137, "dur": 46.694, "args": { "External id": 22799,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5390 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913024.608, "dur": 4.897, "args": { "External id": 22800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5391 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913039.576, "dur": 6.093, "args": { "External id": 22801,"Record function id": 0, "Ev Idx": 5392 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913041.587, "dur": 3.619, "args": { "External id": 22802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913042.816, "dur": 1.818, "args": { "External id": 22803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913043.638, "dur": 0.896, "args": { "External id": 22804,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5395 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913049.254, "dur": 3.967, "args": { "External id": 22805,"Record function id": 0, "Ev Idx": 5396 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913050.344, "dur": 2.443, "args": { "External id": 22806,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913051.088, "dur": 1.254, "args": { "External id": 22807,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5398 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913051.661, "dur": 0.576, "args": { "External id": 22808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5399 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913056.388, "dur": 3.814, "args": { "External id": 22809,"Record function id": 0, "Ev Idx": 5400 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913057.636, "dur": 2.129, "args": { "External id": 22810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913058.164, "dur": 1.115, "args": { "External id": 22811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5402 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913058.611, "dur": 0.560, "args": { "External id": 22812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5403 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913063.220, "dur": 7.184, "args": { "External id": 22813,"Record function id": 0, "Ev Idx": 5404 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913068.152, "dur": 1.844, "args": { "External id": 22814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913068.625, "dur": 0.932, "args": { "External id": 22815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5406 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913068.896, "dur": 0.587, "args": { "External id": 22816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913073.474, "dur": 3.724, "args": { "External id": 22817,"Record function id": 0, "Ev Idx": 5408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913074.425, "dur": 2.365, "args": { "External id": 22818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913074.882, "dur": 1.448, "args": { "External id": 22819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913075.431, "dur": 0.836, "args": { "External id": 22820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913080.402, "dur": 3.491, "args": { "External id": 22821,"Record function id": 0, "Ev Idx": 5412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913081.458, "dur": 2.024, "args": { "External id": 22822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913082.121, "dur": 0.907, "args": { "External id": 22823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913082.411, "dur": 0.558, "args": { "External id": 22824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913086.922, "dur": 4.664, "args": { "External id": 22825,"Record function id": 0, "Ev Idx": 5416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913087.902, "dur": 3.294, "args": { "External id": 22826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913088.339, "dur": 2.403, "args": { "External id": 22827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913090.125, "dur": 0.551, "args": { "External id": 22828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913094.646, "dur": 3.691, "args": { "External id": 22829,"Record function id": 0, "Ev Idx": 5420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651913095.673, "dur": 2.254, "args": { "External id": 22830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913096.125, "dur": 1.273, "args": { "External id": 22831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651913096.678, "dur": 0.647, "args": { "External id": 22832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651913101.880, "dur": 36308.918, "args": { "External id": 22833,"Record function id": 0, "Sequence number": 246545, "Fwd thread id": 1, "Ev Idx": 5424 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651913103.294, "dur": 36298.752, "args": { "External id": 22834,"Sequence number": 246545, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5425 } }, { "ph": "f", "id": 223, "pid": 1336759, "tid": 1381173, "ts": 1295651913103.294, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651913135.909, "dur": 38.104, "args": { "External id": 22835,"Record function id": 0, "Ev Idx": 5426 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651913185.511, "dur": 84.712, "args": { "External id": 22836,"Record function id": 0, "Ev Idx": 5427 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.2)", "pid": 1336759, "tid": 1381173, "ts": 1295651913277.836, "dur": 36116.427, "args": { "External id": 22837,"Record function id": 0, "Ev Idx": 5428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651913369.723, "dur": 7.393, "args": { "External id": 22838,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651913387.604, "dur": 5.362, "args": { "External id": 22839,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5430 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651913409.183, "dur": 35059.684, "args": { "External id": 22840,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651913422.116, "dur": 35037.907, "args": { "External id": 22841,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651913460.328, "dur": 16.729, "args": { "External id": 22842,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651913483.284, "dur": 34940.958, "args": { "External id": 22843,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651913486.290, "dur": 34937.305, "args": { "External id": 22844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651913489.850, "dur": 5.626, "args": { "External id": 22845,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651913497.410, "dur": 34922.594, "args": { "External id": 22846,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651948560.615, "dur": 8.757, "args": { "External id": 22847,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651948563.441, "dur": 5.641, "args": { "External id": 22848,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5439 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651948595.843, "dur": 480.233, "args": { "External id": 22849,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651948626.971, "dur": 443.595, "args": { "External id": 22850,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5441, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651948638.011, "dur": 426.263, "args": { "External id": 22851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5442 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651949100.275, "dur": 2.092, "args": { "External id": 22852,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5443, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949168.952, "dur": 6.773, "args": { "External id": 22853,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949222.024, "dur": 1.859, "args": { "External id": 22854,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949258.509, "dur": 1.440, "args": { "External id": 22855,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949271.874, "dur": 0.844, "args": { "External id": 22856,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949281.816, "dur": 0.958, "args": { "External id": 22857,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949291.754, "dur": 0.653, "args": { "External id": 22858,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949302.387, "dur": 1.178, "args": { "External id": 22859,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949314.298, "dur": 0.781, "args": { "External id": 22860,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949323.690, "dur": 1.704, "args": { "External id": 22861,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5452 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651949426.228, "dur": 2635.507, "args": { "External id": 22862,"Record function id": 0, "Ev Idx": 5453 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651949444.445, "dur": 1002.780, "args": { "External id": 22863,"Record function id": 0, "Ev Idx": 5454 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651949460.857, "dur": 311.311, "args": { "External id": 22864,"Record function id": 0, "Ev Idx": 5455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949537.069, "dur": 4.463, "args": { "External id": 22865,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949544.679, "dur": 0.995, "args": { "External id": 22866,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949547.507, "dur": 1.185, "args": { "External id": 22867,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949550.753, "dur": 1.111, "args": { "External id": 22868,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949553.532, "dur": 1.175, "args": { "External id": 22869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949558.256, "dur": 0.549, "args": { "External id": 22870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949560.421, "dur": 1.356, "args": { "External id": 22871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949563.278, "dur": 0.987, "args": { "External id": 22872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949565.475, "dur": 0.705, "args": { "External id": 22873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651949569.604, "dur": 1.058, "args": { "External id": 22874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5465 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651949589.025, "dur": 155.198, "args": { "External id": 22875,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651949603.770, "dur": 136.311, "args": { "External id": 22876,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651949627.680, "dur": 13.353, "args": { "External id": 22877,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651949644.308, "dur": 69.548, "args": { "External id": 22878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651949647.217, "dur": 66.250, "args": { "External id": 22879,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949651.378, "dur": 5.783, "args": { "External id": 22880,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651949658.930, "dur": 53.944, "args": { "External id": 22881,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5472 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.0", "pid": 1336759, "tid": 1381173, "ts": 1295651949853.641, "dur": 586.235, "args": { "External id": 22882,"Record function id": 0, "Ev Idx": 5473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651949869.181, "dur": 558.079, "args": { "External id": 22883,"Record function id": 0, "Ev Idx": 5474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651949923.774, "dur": 4.386, "args": { "External id": 22884,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651949943.737, "dur": 22.960, "args": { "External id": 22885,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949948.377, "dur": 1.278, "args": { "External id": 22886,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949951.953, "dur": 0.642, "args": { "External id": 22887,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949954.257, "dur": 0.310, "args": { "External id": 22888,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949955.501, "dur": 0.581, "args": { "External id": 22889,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949957.628, "dur": 0.296, "args": { "External id": 22890,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949959.014, "dur": 0.305, "args": { "External id": 22891,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949960.334, "dur": 0.602, "args": { "External id": 22892,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949962.426, "dur": 0.440, "args": { "External id": 22893,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651949963.704, "dur": 0.288, "args": { "External id": 22894,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651949975.505, "dur": 74.487, "args": { "External id": 22895,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5486 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1381173, "ts": 1295651950085.859, "dur": 93.659, "args": { "External id": 22896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651950096.076, "dur": 4.196, "args": { "External id": 22897,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1381173, "ts": 1295651950105.417, "dur": 10.452, "args": { "External id": 22898,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1381173, "ts": 1295651950109.607, "dur": 5.860, "args": { "External id": 22899,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950113.212, "dur": 0.708, "args": { "External id": 22900,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1381173, "ts": 1295651950122.739, "dur": 21.373, "args": { "External id": 22901,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950124.557, "dur": 0.535, "args": { "External id": 22902,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950126.659, "dur": 0.174, "args": { "External id": 22903,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950128.063, "dur": 0.582, "args": { "External id": 22904,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950130.067, "dur": 0.695, "args": { "External id": 22905,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950132.525, "dur": 0.398, "args": { "External id": 22906,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950133.849, "dur": 0.434, "args": { "External id": 22907,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950135.036, "dur": 0.355, "args": { "External id": 22908,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950136.851, "dur": 0.689, "args": { "External id": 22909,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651950138.747, "dur": 0.182, "args": { "External id": 22910,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651950153.516, "dur": 18.625, "args": { "External id": 22911,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651950223.374, "dur": 134.629, "args": { "External id": 22912,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651950268.165, "dur": 85.833, "args": { "External id": 22913,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5504, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1381173, "ts": 1295651950278.599, "dur": 71.451, "args": { "External id": 22914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651950373.757, "dur": 1.729, "args": { "External id": 22915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5506, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651950454.833, "dur": 1586.306, "args": { "External id": 22916,"Sequence number": 246544, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5507 } }, { "ph": "f", "id": 224, "pid": 1336759, "tid": 1381173, "ts": 1295651950454.833, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651950563.139, "dur": 108.838, "args": { "External id": 22917,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5508 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651950713.730, "dur": 37.430, "args": { "External id": 22918,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651950769.073, "dur": 50.370, "args": { "External id": 22919,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651950829.542, "dur": 32.174, "args": { "External id": 22920,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651950868.034, "dur": 47.489, "args": { "External id": 22921,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651950922.918, "dur": 29.823, "args": { "External id": 22922,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651950959.788, "dur": 77.040, "args": { "External id": 22923,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5514 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651951069.538, "dur": 21.923, "args": { "External id": 22924,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5515 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651951112.410, "dur": 26.625, "args": { "External id": 22925,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5516 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651951159.216, "dur": 21.025, "args": { "External id": 22926,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5517 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651951194.588, "dur": 14.599, "args": { "External id": 22927,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951216.692, "dur": 50.909, "args": { "External id": 22928,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951272.733, "dur": 37.025, "args": { "External id": 22929,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5520 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651951341.098, "dur": 168.306, "args": { "External id": 22930,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651951421.083, "dur": 5.803, "args": { "External id": 22931,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651951428.803, "dur": 1.864, "args": { "External id": 22932,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5523 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651951539.097, "dur": 23.041, "args": { "External id": 22933,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5524 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651951573.189, "dur": 13.881, "args": { "External id": 22934,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951595.685, "dur": 32.542, "args": { "External id": 22935,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951634.179, "dur": 32.671, "args": { "External id": 22936,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951672.599, "dur": 20.156, "args": { "External id": 22937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951697.336, "dur": 28.739, "args": { "External id": 22938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951732.555, "dur": 19.302, "args": { "External id": 22939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651951757.492, "dur": 28.520, "args": { "External id": 22940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5531 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651951801.895, "dur": 20.962, "args": { "External id": 22941,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5532 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651951842.363, "dur": 37.231, "args": { "External id": 22942,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651951899.438, "dur": 15.869, "args": { "External id": 22943,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651951930.110, "dur": 12.705, "args": { "External id": 22944,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651951958.036, "dur": 14.786, "args": { "External id": 22945,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5536 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952084.918, "dur": 15.251, "args": { "External id": 22946,"Record function id": 0, "Ev Idx": 5537 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952088.443, "dur": 10.691, "args": { "External id": 22947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952092.648, "dur": 5.613, "args": { "External id": 22948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5539 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952094.143, "dur": 4.007, "args": { "External id": 22949,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5540 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952104.043, "dur": 4.825, "args": { "External id": 22950,"Record function id": 0, "Ev Idx": 5541 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952105.580, "dur": 2.881, "args": { "External id": 22951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952106.433, "dur": 1.562, "args": { "External id": 22952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5543 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952107.021, "dur": 0.872, "args": { "External id": 22953,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5544 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952111.979, "dur": 4.071, "args": { "External id": 22954,"Record function id": 0, "Ev Idx": 5545 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952113.205, "dur": 2.389, "args": { "External id": 22955,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952113.708, "dur": 1.449, "args": { "External id": 22956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5547 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952114.415, "dur": 0.633, "args": { "External id": 22957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5548 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952119.213, "dur": 4.150, "args": { "External id": 22958,"Record function id": 0, "Ev Idx": 5549 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952120.188, "dur": 2.765, "args": { "External id": 22959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952120.940, "dur": 1.588, "args": { "External id": 22960,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5551 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952121.250, "dur": 1.198, "args": { "External id": 22961,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5552 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952126.496, "dur": 4.277, "args": { "External id": 22962,"Record function id": 0, "Ev Idx": 5553 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952127.647, "dur": 2.665, "args": { "External id": 22963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952128.413, "dur": 1.440, "args": { "External id": 22964,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5555 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952128.886, "dur": 0.899, "args": { "External id": 22965,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952134.008, "dur": 3.927, "args": { "External id": 22966,"Record function id": 0, "Ev Idx": 5557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952135.204, "dur": 2.328, "args": { "External id": 22967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952135.746, "dur": 1.373, "args": { "External id": 22968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952136.206, "dur": 0.846, "args": { "External id": 22969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952140.999, "dur": 3.637, "args": { "External id": 22970,"Record function id": 0, "Ev Idx": 5561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952142.158, "dur": 2.061, "args": { "External id": 22971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952142.657, "dur": 1.108, "args": { "External id": 22972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952142.929, "dur": 0.770, "args": { "External id": 22973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952147.593, "dur": 3.905, "args": { "External id": 22974,"Record function id": 0, "Ev Idx": 5565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952148.803, "dur": 2.261, "args": { "External id": 22975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952149.324, "dur": 1.310, "args": { "External id": 22976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952149.589, "dur": 0.976, "args": { "External id": 22977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952154.458, "dur": 4.912, "args": { "External id": 22978,"Record function id": 0, "Ev Idx": 5569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651952155.578, "dur": 3.384, "args": { "External id": 22979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952156.110, "dur": 2.450, "args": { "External id": 22980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651952157.658, "dur": 0.780, "args": { "External id": 22981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651952162.855, "dur": 35336.230, "args": { "External id": 22982,"Record function id": 0, "Sequence number": 246543, "Fwd thread id": 1, "Ev Idx": 5573 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651952164.424, "dur": 35325.911, "args": { "External id": 22983,"Sequence number": 246543, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5574 } }, { "ph": "f", "id": 225, "pid": 1336759, "tid": 1381173, "ts": 1295651952164.424, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651952191.828, "dur": 54.433, "args": { "External id": 22984,"Record function id": 0, "Ev Idx": 5575 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651952256.399, "dur": 67.864, "args": { "External id": 22985,"Record function id": 0, "Ev Idx": 5576 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.1)", "pid": 1336759, "tid": 1381173, "ts": 1295651952333.748, "dur": 35148.828, "args": { "External id": 22986,"Record function id": 0, "Ev Idx": 5577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651952424.690, "dur": 7.252, "args": { "External id": 22987,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651952441.897, "dur": 5.408, "args": { "External id": 22988,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651952461.765, "dur": 34222.570, "args": { "External id": 22989,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651952478.351, "dur": 34197.456, "args": { "External id": 22990,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651952518.244, "dur": 14.923, "args": { "External id": 22991,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651952539.427, "dur": 34096.708, "args": { "External id": 22992,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651952543.817, "dur": 34091.659, "args": { "External id": 22993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651952547.074, "dur": 5.084, "args": { "External id": 22994,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651952553.746, "dur": 34078.198, "args": { "External id": 22995,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295651986772.623, "dur": 9.318, "args": { "External id": 22996,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651986775.613, "dur": 5.988, "args": { "External id": 22997,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5588 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295651986809.469, "dur": 382.501, "args": { "External id": 22998,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5589 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651986838.003, "dur": 348.712, "args": { "External id": 22999,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5590, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295651986849.383, "dur": 331.289, "args": { "External id": 23000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5591 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295651987214.057, "dur": 2.468, "args": { "External id": 23001,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5592, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987293.619, "dur": 6.845, "args": { "External id": 23002,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987343.700, "dur": 1.393, "args": { "External id": 23003,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987359.661, "dur": 0.924, "args": { "External id": 23004,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987370.718, "dur": 0.925, "args": { "External id": 23005,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987382.169, "dur": 0.914, "args": { "External id": 23006,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987392.140, "dur": 0.753, "args": { "External id": 23007,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987402.353, "dur": 0.857, "args": { "External id": 23008,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987412.535, "dur": 1.115, "args": { "External id": 23009,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987422.383, "dur": 0.929, "args": { "External id": 23010,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5601 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651987513.967, "dur": 2065.535, "args": { "External id": 23011,"Record function id": 0, "Ev Idx": 5602 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651987532.269, "dur": 408.097, "args": { "External id": 23012,"Record function id": 0, "Ev Idx": 5603 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651987548.240, "dur": 308.067, "args": { "External id": 23013,"Record function id": 0, "Ev Idx": 5604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987625.757, "dur": 4.002, "args": { "External id": 23014,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987633.589, "dur": 1.217, "args": { "External id": 23015,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987636.917, "dur": 1.624, "args": { "External id": 23016,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987640.326, "dur": 0.768, "args": { "External id": 23017,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987642.593, "dur": 1.213, "args": { "External id": 23018,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987646.135, "dur": 1.379, "args": { "External id": 23019,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987649.311, "dur": 6.333, "args": { "External id": 23020,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987657.730, "dur": 0.422, "args": { "External id": 23021,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987659.633, "dur": 1.086, "args": { "External id": 23022,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651987663.589, "dur": 0.558, "args": { "External id": 23023,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5614 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651987681.752, "dur": 147.596, "args": { "External id": 23024,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651987699.301, "dur": 125.686, "args": { "External id": 23025,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651987718.428, "dur": 12.782, "args": { "External id": 23026,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651987734.557, "dur": 65.023, "args": { "External id": 23027,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651987737.301, "dur": 61.953, "args": { "External id": 23028,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651987741.536, "dur": 5.247, "args": { "External id": 23029,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651987748.773, "dur": 49.857, "args": { "External id": 23030,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5621 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651987947.082, "dur": 1612.609, "args": { "External id": 23031,"Sequence number": 246542, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5622 } }, { "ph": "f", "id": 226, "pid": 1336759, "tid": 1381173, "ts": 1295651987947.082, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988098.420, "dur": 108.417, "args": { "External id": 23032,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336759, "tid": 1381173, "ts": 1295651988261.841, "dur": 40.555, "args": { "External id": 23033,"kernel_hash": "cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/m5/cm5os3r6hv7ysipdpiairo6lyepmpaszxgfbktm3djkrvim3pzmx.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336759, "tid": 1381173, "ts": 1295651988320.933, "dur": 51.365, "args": { "External id": 23034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988381.236, "dur": 31.813, "args": { "External id": 23035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988420.181, "dur": 44.948, "args": { "External id": 23036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988472.568, "dur": 26.649, "args": { "External id": 23037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988505.877, "dur": 44.764, "args": { "External id": 23038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5629 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336759, "tid": 1381173, "ts": 1295651988574.293, "dur": 22.849, "args": { "External id": 23039,"kernel_hash": "c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/47/c47x727mhg3ctiwzlmxagokbourh3jzbxm2pk4af4zajlvil6mbi.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5630 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336759, "tid": 1381173, "ts": 1295651988614.124, "dur": 30.497, "args": { "External id": 23040,"kernel_hash": "cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/xr/cxrz26z2x5pfml2f2w22jccdkyygktk5hbwlaypdvvhkn4fqlm5d.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5631 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651988686.452, "dur": 20.947, "args": { "External id": 23041,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5632 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651988720.409, "dur": 13.567, "args": { "External id": 23042,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988741.864, "dur": 27.611, "args": { "External id": 23043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651988772.762, "dur": 31.965, "args": { "External id": 23044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5635 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336759, "tid": 1381173, "ts": 1295651988830.268, "dur": 203.298, "args": { "External id": 23045,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651988905.377, "dur": 5.659, "args": { "External id": 23046,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651988912.875, "dur": 2.432, "args": { "External id": 23047,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5638 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651989068.021, "dur": 27.065, "args": { "External id": 23048,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5639 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1381173, "ts": 1295651989106.630, "dur": 13.126, "args": { "External id": 23049,"kernel_hash": "c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/6o/c6otstk2ryxkcc2uxmrjmab44n43krf6sqcczamirphtzygmmb65.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989128.499, "dur": 39.123, "args": { "External id": 23050,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989173.555, "dur": 35.300, "args": { "External id": 23051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989215.689, "dur": 39.045, "args": { "External id": 23052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989263.048, "dur": 32.784, "args": { "External id": 23053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989305.232, "dur": 19.398, "args": { "External id": 23054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1381173, "ts": 1295651989331.405, "dur": 28.990, "args": { "External id": 23055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5646 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336759, "tid": 1381173, "ts": 1295651989379.151, "dur": 23.323, "args": { "External id": 23056,"kernel_hash": "cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/g4/cg4ukr25hvc6fhe6tywzzdige4qswrvbmpfxtd3w73o2rbqqnxdc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5647 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336759, "tid": 1381173, "ts": 1295651989422.340, "dur": 22.803, "args": { "External id": 23057,"kernel_hash": "c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4n/c4n3ou2ncjbisanhyo3hqtp5omwwxz2moubkkc2nbkm4ze4hfkis.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5648 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336759, "tid": 1381173, "ts": 1295651989458.632, "dur": 19.190, "args": { "External id": 23058,"kernel_hash": "co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/o6/co6fecdb2uywcxfuxcz5nj3kv5higyqx2aburlbzi3bvynrhar7n.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5649 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336759, "tid": 1381173, "ts": 1295651989491.848, "dur": 13.408, "args": { "External id": 23059,"kernel_hash": "c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/35/c35ivrp4vzea2wu6fb3b63szlroo6fc5n7miteort3yhwxwmfsty.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5650 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336759, "tid": 1381173, "ts": 1295651989517.273, "dur": 14.699, "args": { "External id": 23060,"kernel_hash": "cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u7/cu7quhizahhnunbe25uov4qu4xq6kfyaol7a4xbozhkfrtszumjz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5651 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989602.518, "dur": 14.926, "args": { "External id": 23061,"Record function id": 0, "Ev Idx": 5652 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989605.816, "dur": 10.700, "args": { "External id": 23062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989610.191, "dur": 5.496, "args": { "External id": 23063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5654 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989611.438, "dur": 4.123, "args": { "External id": 23064,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5655 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989621.316, "dur": 7.979, "args": { "External id": 23065,"Record function id": 0, "Ev Idx": 5656 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989622.638, "dur": 6.211, "args": { "External id": 23066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989623.402, "dur": 4.974, "args": { "External id": 23067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5658 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989623.947, "dur": 4.336, "args": { "External id": 23068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5659 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989632.655, "dur": 4.265, "args": { "External id": 23069,"Record function id": 0, "Ev Idx": 5660 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989634.254, "dur": 2.215, "args": { "External id": 23070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989634.726, "dur": 1.345, "args": { "External id": 23071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5662 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989635.197, "dur": 0.763, "args": { "External id": 23072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5663 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989640.232, "dur": 4.644, "args": { "External id": 23073,"Record function id": 0, "Ev Idx": 5664 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989642.099, "dur": 2.317, "args": { "External id": 23074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989642.780, "dur": 1.159, "args": { "External id": 23075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5666 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989643.200, "dur": 0.660, "args": { "External id": 23076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5667 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989647.852, "dur": 4.098, "args": { "External id": 23077,"Record function id": 0, "Ev Idx": 5668 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989649.125, "dur": 2.395, "args": { "External id": 23078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989649.975, "dur": 1.105, "args": { "External id": 23079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5670 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989650.342, "dur": 0.670, "args": { "External id": 23080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5671 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989654.992, "dur": 5.135, "args": { "External id": 23081,"Record function id": 0, "Ev Idx": 5672 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989656.292, "dur": 3.401, "args": { "External id": 23082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989656.991, "dur": 2.247, "args": { "External id": 23083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5674 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989658.680, "dur": 0.453, "args": { "External id": 23084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5675 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989663.200, "dur": 4.063, "args": { "External id": 23085,"Record function id": 0, "Ev Idx": 5676 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989664.512, "dur": 2.344, "args": { "External id": 23086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989665.011, "dur": 1.430, "args": { "External id": 23087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5678 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989665.649, "dur": 0.710, "args": { "External id": 23088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5679 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989670.280, "dur": 3.956, "args": { "External id": 23089,"Record function id": 0, "Ev Idx": 5680 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989671.615, "dur": 2.203, "args": { "External id": 23090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989672.115, "dur": 1.301, "args": { "External id": 23091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5682 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989672.596, "dur": 0.757, "args": { "External id": 23092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5683 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989677.177, "dur": 4.425, "args": { "External id": 23093,"Record function id": 0, "Ev Idx": 5684 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295651989678.458, "dur": 2.708, "args": { "External id": 23094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989678.895, "dur": 1.883, "args": { "External id": 23095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5686 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295651989679.422, "dur": 1.291, "args": { "External id": 23096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5687 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651989689.122, "dur": 35710.746, "args": { "External id": 23097,"Record function id": 0, "Sequence number": 246541, "Fwd thread id": 1, "Ev Idx": 5688 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295651989690.258, "dur": 35700.543, "args": { "External id": 23098,"Sequence number": 246541, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5689 } }, { "ph": "f", "id": 227, "pid": 1336759, "tid": 1381173, "ts": 1295651989690.258, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651989718.498, "dur": 41.550, "args": { "External id": 23099,"Record function id": 0, "Ev Idx": 5690 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651989767.751, "dur": 68.379, "args": { "External id": 23100,"Record function id": 0, "Ev Idx": 5691 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.0)", "pid": 1336759, "tid": 1381173, "ts": 1295651989843.535, "dur": 35539.219, "args": { "External id": 23101,"Record function id": 0, "Ev Idx": 5692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651989933.807, "dur": 5.779, "args": { "External id": 23102,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295651989952.100, "dur": 4.939, "args": { "External id": 23103,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5694 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651989970.384, "dur": 34608.019, "args": { "External id": 23104,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295651989983.151, "dur": 34585.419, "args": { "External id": 23105,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295651990082.023, "dur": 16.305, "args": { "External id": 23106,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295651990104.913, "dur": 34427.856, "args": { "External id": 23107,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295651990107.518, "dur": 34424.596, "args": { "External id": 23108,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295651990110.994, "dur": 6.257, "args": { "External id": 23109,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295651990119.005, "dur": 34410.507, "args": { "External id": 23110,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295652024670.148, "dur": 9.100, "args": { "External id": 23111,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295652024672.843, "dur": 6.046, "args": { "External id": 23112,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5703 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295652024705.351, "dur": 369.141, "args": { "External id": 23113,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5704 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295652024735.143, "dur": 334.061, "args": { "External id": 23114,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5705, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295652024745.771, "dur": 317.810, "args": { "External id": 23115,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5706 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295652025096.989, "dur": 2.216, "args": { "External id": 23116,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5707, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025161.862, "dur": 6.356, "args": { "External id": 23117,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025212.716, "dur": 1.298, "args": { "External id": 23118,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025244.178, "dur": 2.066, "args": { "External id": 23119,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025262.201, "dur": 1.453, "args": { "External id": 23120,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025275.489, "dur": 1.227, "args": { "External id": 23121,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025286.013, "dur": 1.025, "args": { "External id": 23122,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025297.682, "dur": 1.364, "args": { "External id": 23123,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025309.402, "dur": 0.981, "args": { "External id": 23124,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652025319.019, "dur": 1.239, "args": { "External id": 23125,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5716 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295652025416.132, "dur": 255.608, "args": { "External id": 23126,"Record function id": 0, "Sequence number": 246540, "Fwd thread id": 1, "Ev Idx": 5717 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336759, "tid": 1381173, "ts": 1295652025419.060, "dur": 244.824, "args": { "External id": 23127,"Sequence number": 246540, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5718 } }, { "ph": "f", "id": 228, "pid": 1336759, "tid": 1381173, "ts": 1295652025419.060, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_0", "pid": 1336759, "tid": 1381173, "ts": 1295652025530.629, "dur": 44.484, "args": { "External id": 23128,"kernel_hash": "cqy2wwurxdpkuy27hkscegzor44hvby6k37yecnbppfr7quxx5hx", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/qy/cqy2wwurxdpkuy27hkscegzor44hvby6k37yecnbppfr7quxx5hx.py", "kernel_backend": "triton", "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 5719 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_1", "pid": 1336759, "tid": 1381173, "ts": 1295652025588.888, "dur": 24.745, "args": { "External id": 23129,"kernel_hash": "cdyaclk3pd7t6z6zuqzswmelsxchlewwniqxs4434hgglihydkpz", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/dy/cdyaclk3pd7t6z6zuqzswmelsxchlewwniqxs4434hgglihydkpz.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "float", "Scalar"], "Input Strides": [[4096, 1], [8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096], [16, 4096, 2048], [32000, 2048], []], "Ev Idx": 5720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_2", "pid": 1336759, "tid": 1381173, "ts": 1295652025629.924, "dur": 19.798, "args": { "External id": 23130,"kernel_hash": "cvyxdor6u3emsju5qmfjq37syr77ijvjswkrldbg6t62lvcr3cem", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/vy/cvyxdor6u3emsju5qmfjq37syr77ijvjswkrldbg6t62lvcr3cem.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 5721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295652025681.104, "dur": 14.472, "args": { "External id": 23131,"Record function id": 0, "Ev Idx": 5722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336759, "tid": 1381173, "ts": 1295652025684.275, "dur": 10.281, "args": { "External id": 23132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1381173, "ts": 1295652025687.847, "dur": 5.902, "args": { "External id": 23133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1381173, "ts": 1295652025689.354, "dur": 4.266, "args": { "External id": 23134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5725 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_post_backward_callback", "pid": 1336759, "tid": 1381173, "ts": 1295652025714.378, "dur": 7135.515, "args": { "External id": 23135,"Record function id": 0, "Ev Idx": 5726 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate", "pid": 1336759, "tid": 1381173, "ts": 1295652025731.902, "dur": 30.668, "args": { "External id": 23136,"Record function id": 0, "Ev Idx": 5727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard", "pid": 1336759, "tid": 1381173, "ts": 1295652025768.451, "dur": 198.237, "args": { "External id": 23137,"Record function id": 0, "Ev Idx": 5728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce", "pid": 1336759, "tid": 1381173, "ts": 1295652025972.857, "dur": 6608.220, "args": { "External id": 23138,"Record function id": 0, "Ev Idx": 5729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295652026144.740, "dur": 7.536, "args": { "External id": 23139,"Record function id": 0, "Concrete Inputs": ["[336611328]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1381173, "ts": 1295652026163.003, "dur": 5.295, "args": { "External id": 23140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5731 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295652026187.568, "dur": 5180.706, "args": { "External id": 23141,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336759, "tid": 1381173, "ts": 1295652026205.833, "dur": 5149.786, "args": { "External id": 23142,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295652026489.316, "dur": 21.449, "args": { "External id": 23143,"Record function id": 0, "Concrete Inputs": ["[82421]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1381173, "ts": 1295652026569.909, "dur": 4739.016, "args": { "External id": 23144,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], [], []], "Ev Idx": 5735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1381173, "ts": 1295652026573.031, "dur": 4734.822, "args": { "External id": 23145,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], []], "Ev Idx": 5736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652026577.265, "dur": 12.656, "args": { "External id": 23146,"Record function id": 0, "Concrete Inputs": ["[82421]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1381173, "ts": 1295652026592.312, "dur": 4709.773, "args": { "External id": 23147,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[82421], [82421], []], "Ev Idx": 5738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1381173, "ts": 1295652031495.641, "dur": 11.315, "args": { "External id": 23148,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[336611328], [], [], [], [], []], "Ev Idx": 5739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1381173, "ts": 1295652031498.994, "dur": 7.539, "args": { "External id": 23149,"Record function id": 0, "Concrete Inputs": ["[42076416]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5740 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336759, "tid": 1381173, "ts": 1295652031534.763, "dur": 414.629, "args": { "External id": 23150,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[42076416], [336611328], [], [], [], []], "Ev Idx": 5741 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295652031561.990, "dur": 383.076, "args": { "External id": 23151,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 42076416, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[336611328], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5742, "In msg nelems": 336611328 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336759, "tid": 1381173, "ts": 1295652031577.865, "dur": 362.426, "args": { "External id": 23152,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[336611328]], "Ev Idx": 5743 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1381173, "ts": 1295652031968.608, "dur": 2.122, "args": { "External id": 23153,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5744, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032064.010, "dur": 7.332, "args": { "External id": 23154,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032113.843, "dur": 1.573, "args": { "External id": 23155,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032129.487, "dur": 1.133, "args": { "External id": 23156,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8192256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032141.944, "dur": 0.994, "args": { "External id": 23157,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8716544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032153.480, "dur": 0.774, "args": { "External id": 23158,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9240832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032162.547, "dur": 1.800, "args": { "External id": 23159,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9765120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032176.523, "dur": 1.006, "args": { "External id": 23160,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032187.352, "dur": 1.215, "args": { "External id": 23161,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "10289664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032198.787, "dur": 0.625, "args": { "External id": 23162,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "11731456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032207.534, "dur": 1.165, "args": { "External id": 23163,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "13173248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032217.305, "dur": 1.128, "args": { "External id": 23164,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032226.713, "dur": 1.102, "args": { "External id": 23165,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "14615296"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032257.829, "dur": 1.581, "args": { "External id": 23166,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15139584"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032269.150, "dur": 1.163, "args": { "External id": 23167,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15663872"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032279.357, "dur": 1.230, "args": { "External id": 23168,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "16188160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032289.378, "dur": 1.108, "args": { "External id": 23169,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032298.936, "dur": 0.984, "args": { "External id": 23170,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "16712704"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032309.919, "dur": 0.940, "args": { "External id": 23171,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "18154496"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032319.101, "dur": 1.332, "args": { "External id": 23172,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "19596288"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032329.409, "dur": 0.974, "args": { "External id": 23173,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032339.940, "dur": 1.043, "args": { "External id": 23174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21038336"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032349.988, "dur": 0.984, "args": { "External id": 23175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21562624"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032359.207, "dur": 0.964, "args": { "External id": 23176,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22086912"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032370.645, "dur": 1.395, "args": { "External id": 23177,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22611200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032381.167, "dur": 0.800, "args": { "External id": 23178,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032390.097, "dur": 1.160, "args": { "External id": 23179,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "23135744"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032400.027, "dur": 0.773, "args": { "External id": 23180,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "24577536"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032409.408, "dur": 1.027, "args": { "External id": 23181,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "26019328"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032419.560, "dur": 1.061, "args": { "External id": 23182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032430.074, "dur": 1.364, "args": { "External id": 23183,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27461376"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032439.877, "dur": 1.064, "args": { "External id": 23184,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27985664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032449.496, "dur": 1.361, "args": { "External id": 23185,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "28509952"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032458.406, "dur": 0.720, "args": { "External id": 23186,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "29034240"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032467.346, "dur": 1.254, "args": { "External id": 23187,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032478.911, "dur": 1.184, "args": { "External id": 23188,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "29558784"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032489.318, "dur": 1.086, "args": { "External id": 23189,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "31000576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032499.704, "dur": 1.072, "args": { "External id": 23190,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "32442368"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032509.264, "dur": 1.203, "args": { "External id": 23191,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1381173, "ts": 1295652032518.237, "dur": 0.586, "args": { "External id": 23192,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "33884416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5783 } }, { "ph": "X", "cat": "user_annotation", "name": "ProfilerStep#1023", "pid": 1336759, "tid": 1336759, "ts": 1295649886375.721, "dur": 2164047.907, "args": { "External id": 12289,"Record function id": 0, "Ev Idx": 5784 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.zero_grad#AdamW.zero_grad", "pid": 1336759, "tid": 1336759, "ts": 1295649886407.153, "dur": 526.955, "args": { "External id": 12290,"Record function id": 0, "Ev Idx": 5785 } }, { "ph": "X", "cat": "user_annotation", "name": "enumerate(DataLoader)#_StatefulMultiProcessingDataLoaderIter.__next__", "pid": 1336759, "tid": 1336759, "ts": 1295649886973.528, "dur": 1942.196, "args": { "External id": 12291,"Record function id": 0, "Ev Idx": 5786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649887937.522, "dur": 7.398, "args": { "External id": 12292,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336759, "tid": 1336759, "ts": 1295649887965.665, "dur": 7.410, "args": { "External id": 12293,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649888424.766, "dur": 2.837, "args": { "External id": 12294,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336759, "tid": 1336759, "ts": 1295649888435.485, "dur": 3.031, "args": { "External id": 12295,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649888811.331, "dur": 1.787, "args": { "External id": 12296,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336759, "tid": 1336759, "ts": 1295649888819.683, "dur": 1.793, "args": { "External id": 12297,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649889463.364, "dur": 14.116, "args": { "External id": 12298,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649889470.897, "dur": 2.795, "args": { "External id": 12299,"Record function id": 0, "Concrete Inputs": ["", "[16, 8192]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649889479.056, "dur": 4.626, "args": { "External id": 12300,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649889481.348, "dur": 1.199, "args": { "External id": 12301,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649889509.526, "dur": 459.382, "args": { "External id": 12302,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], [], []], "Ev Idx": 5797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649889516.727, "dur": 451.256, "args": { "External id": 12303,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649889523.864, "dur": 10.040, "args": { "External id": 12304,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649889536.226, "dur": 430.364, "args": { "External id": 12305,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649889546.265, "dur": 0.538, "args": { "External id": 12306,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336759, "tid": 1336759, "ts": 1295649889550.109, "dur": 9.186, "args": { "External id": 12307,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[8192, 1], [4096, 1]], "Input Dims": [[16, 4096], [16, 4096]], "Ev Idx": 5802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336759, "tid": 1336759, "ts": 1295649889554.636, "dur": 4.502, "args": { "External id": 12308,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], []], "Input Dims": [[16, 4096], [], []], "Ev Idx": 5803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649889558.017, "dur": 0.842, "args": { "External id": 12309,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295649889561.582, "dur": 181.861, "args": { "External id": 12310,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295649889564.152, "dur": 178.903, "args": { "External id": 12311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295649889566.369, "dur": 15.285, "args": { "External id": 12312,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 5807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649889568.208, "dur": 12.896, "args": { "External id": 12313,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649889582.316, "dur": 160.416, "args": { "External id": 12314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649889745.242, "dur": 218.491, "args": { "External id": 12315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649890023.340, "dur": 477.430, "args": { "External id": 12316,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 5811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649890025.167, "dur": 475.008, "args": { "External id": 12317,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], []], "Ev Idx": 5812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890032.263, "dur": 9.338, "args": { "External id": 12318,"Record function id": 0, "Concrete Inputs": ["[16, 8192]", "[8192, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649890042.975, "dur": 453.431, "args": { "External id": 12319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[8192, 1], [8192, 1], []], "Input Dims": [[16, 8192], [16, 8192], []], "Ev Idx": 5814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336759, "tid": 1336759, "ts": 1295649890533.610, "dur": 57.389, "args": { "External id": 12320,"Record function id": 0, "Concrete Inputs": ["0", "4096", "", "", "", "False"], "Input type": ["Scalar", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649890540.432, "dur": 5.974, "args": { "External id": 12321,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336759, "tid": 1336759, "ts": 1295649890549.779, "dur": 40.569, "args": { "External id": 12322,"Record function id": 0, "Concrete Inputs": ["0", "4096", "1", ""], "Input type": ["Scalar", "Scalar", "Scalar", "long int"], "Input Strides": [[], [], [], [1]], "Input Dims": [[], [], [], [0]], "Ev Idx": 5817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295649890555.916, "dur": 7.343, "args": { "External id": 12323,"Record function id": 0, "Concrete Inputs": ["", "[4096]", ""], "Input type": ["long int", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 5818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::repeat", "pid": 1336759, "tid": 1336759, "ts": 1295649890603.663, "dur": 68.107, "args": { "External id": 12324,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4096], []], "Ev Idx": 5819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336759, "tid": 1336759, "ts": 1295649890609.047, "dur": 6.234, "args": { "External id": 12325,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[4096], [], []], "Ev Idx": 5820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890613.183, "dur": 1.800, "args": { "External id": 12326,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "[4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[4096], [], [], []], "Ev Idx": 5821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649890616.222, "dur": 4.072, "args": { "External id": 12327,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1336759, "ts": 1295649890622.587, "dur": 2.955, "args": { "External id": 12328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[4096, 1]], "Input Dims": [[16, 4096]], "Ev Idx": 5823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336759, "tid": 1336759, "ts": 1295649890630.426, "dur": 4.790, "args": { "External id": 12329,"Record function id": 0, "Concrete Inputs": ["", "0", "1", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890634.436, "dur": 0.626, "args": { "External id": 12330,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1]", "[4096, 1, 4096]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336759, "tid": 1336759, "ts": 1295649890635.971, "dur": 3.436, "args": { "External id": 12331,"Record function id": 0, "Concrete Inputs": ["", "1", "4096", "4096"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890638.482, "dur": 0.832, "args": { "External id": 12332,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[4096, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336759, "tid": 1336759, "ts": 1295649890641.418, "dur": 4.047, "args": { "External id": 12333,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[4096, 1], [4096, 4096, 4096, 1]], "Input Dims": [[1, 4096], [16, 1, 1, 4096]], "Ev Idx": 5828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336759, "tid": 1336759, "ts": 1295649890642.978, "dur": 2.256, "args": { "External id": 12334,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[4096, 1], [], []], "Input Dims": [[1, 4096], [], []], "Ev Idx": 5829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890644.439, "dur": 0.703, "args": { "External id": 12335,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[0, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[1, 4096], [], [], []], "Ev Idx": 5830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649890646.731, "dur": 24.338, "args": { "External id": 12336,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 4096, 4096, 1], [0, 4096, 4096, 1], []], "Input Dims": [[16, 1, 1, 4096], [16, 1, 1, 4096], []], "Ev Idx": 5831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649890680.539, "dur": 27.262, "args": { "External id": 12337,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649890682.068, "dur": 25.558, "args": { "External id": 12338,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "", "", "", "False", ""], "Input type": ["long int", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649890687.859, "dur": 3.219, "args": { "External id": 12339,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "3", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649890691.755, "dur": 15.354, "args": { "External id": 12340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5835 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_pre_forward", "pid": 1336759, "tid": 1336759, "ts": 1295649890815.628, "dur": 141.641, "args": { "External id": 12341,"Record function id": 0, "Ev Idx": 5836 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::inputs_to_device", "pid": 1336759, "tid": 1336759, "ts": 1295649890891.596, "dur": 55.062, "args": { "External id": 12342,"Record function id": 0, "Ev Idx": 5837 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295649890963.931, "dur": 91.209, "args": { "External id": 12343,"Record function id": 0, "Ev Idx": 5838 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward", "pid": 1336759, "tid": 1336759, "ts": 1295649891064.194, "dur": 10589.104, "args": { "External id": 12344,"Record function id": 0, "Ev Idx": 5839 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather", "pid": 1336759, "tid": 1336759, "ts": 1295649891073.808, "dur": 1215.713, "args": { "External id": 12345,"Record function id": 0, "Ev Idx": 5840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649891174.698, "dur": 7.488, "args": { "External id": 12346,"Record function id": 0, "Concrete Inputs": ["[42076416]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649891198.758, "dur": 130.896, "args": { "External id": 12347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891203.672, "dur": 1.535, "args": { "External id": 12348,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891210.089, "dur": 0.212, "args": { "External id": 12349,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891211.049, "dur": 0.416, "args": { "External id": 12350,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8192256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891211.995, "dur": 1.544, "args": { "External id": 12351,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8716544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891217.380, "dur": 0.338, "args": { "External id": 12352,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9240832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891218.261, "dur": 0.309, "args": { "External id": 12353,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9765120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891219.122, "dur": 2.327, "args": { "External id": 12354,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891223.488, "dur": 0.181, "args": { "External id": 12355,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "10289664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891224.176, "dur": 0.265, "args": { "External id": 12356,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11731456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891250.613, "dur": 0.676, "args": { "External id": 12357,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "13173248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891253.239, "dur": 0.272, "args": { "External id": 12358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891254.094, "dur": 1.408, "args": { "External id": 12359,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "14615296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891258.146, "dur": 0.442, "args": { "External id": 12360,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15139584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891259.280, "dur": 0.335, "args": { "External id": 12361,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15663872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891260.229, "dur": 2.515, "args": { "External id": 12362,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "16188160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891264.306, "dur": 0.171, "args": { "External id": 12363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891265.179, "dur": 0.138, "args": { "External id": 12364,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "16712704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891268.646, "dur": 0.232, "args": { "External id": 12365,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "18154496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891269.562, "dur": 0.306, "args": { "External id": 12366,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "19596288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891270.896, "dur": 1.266, "args": { "External id": 12367,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891275.558, "dur": 0.289, "args": { "External id": 12368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21038336"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891276.378, "dur": 0.381, "args": { "External id": 12369,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21562624"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891277.353, "dur": 1.798, "args": { "External id": 12370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22086912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891282.040, "dur": 0.173, "args": { "External id": 12371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22611200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891283.373, "dur": 0.241, "args": { "External id": 12372,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891286.580, "dur": 0.382, "args": { "External id": 12373,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "23135744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891287.702, "dur": 0.347, "args": { "External id": 12374,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "24577536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891289.062, "dur": 1.400, "args": { "External id": 12375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "26019328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891293.037, "dur": 0.505, "args": { "External id": 12376,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891294.401, "dur": 0.291, "args": { "External id": 12377,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27461376"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891295.634, "dur": 2.360, "args": { "External id": 12378,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27985664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891298.785, "dur": 0.127, "args": { "External id": 12379,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "28509952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891299.946, "dur": 0.258, "args": { "External id": 12380,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "29034240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891303.090, "dur": 0.140, "args": { "External id": 12381,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891304.195, "dur": 0.443, "args": { "External id": 12382,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29558784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891305.500, "dur": 1.008, "args": { "External id": 12383,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "31000576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891309.472, "dur": 0.324, "args": { "External id": 12384,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "32442368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891310.719, "dur": 0.474, "args": { "External id": 12385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891312.045, "dur": 2.065, "args": { "External id": 12386,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "33884416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649891350.955, "dur": 78.670, "args": { "External id": 12387,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5882 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295649891496.293, "dur": 220.633, "args": { "External id": 12388,"Record function id": 0, "Concrete Inputs": ["", "", "42076416", "8", "6", "15", ""], "Input type": ["TensorList", "", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 5883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649891510.340, "dur": 4.965, "args": { "External id": 12389,"Record function id": 0, "Concrete Inputs": ["[336611328]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295649891521.572, "dur": 11.600, "args": { "External id": 12390,"Record function id": 0, "Concrete Inputs": ["", "0", "252458496", "42076416"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649891526.725, "dur": 6.013, "args": { "External id": 12391,"Record function id": 0, "Concrete Inputs": ["", "0", "252458496", "294534912", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[336611328], [], [], [], []], "Ev Idx": 5886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891530.053, "dur": 0.483, "args": { "External id": 12392,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "[1]", "252458496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649891541.151, "dur": 88.407, "args": { "External id": 12393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891543.498, "dur": 0.533, "args": { "External id": 12394,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "252458496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891545.310, "dur": 0.428, "args": { "External id": 12395,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "260650496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891546.796, "dur": 1.342, "args": { "External id": 12396,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "260650752"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891549.293, "dur": 0.621, "args": { "External id": 12397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "261175040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891551.004, "dur": 0.465, "args": { "External id": 12398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "261699328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891552.420, "dur": 0.279, "args": { "External id": 12399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "262223616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891553.962, "dur": 0.431, "args": { "External id": 12400,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "262747904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891555.407, "dur": 0.434, "args": { "External id": 12401,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "262748160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891556.958, "dur": 0.700, "args": { "External id": 12402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "264189952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891558.429, "dur": 0.252, "args": { "External id": 12403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "265631744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891559.656, "dur": 1.102, "args": { "External id": 12404,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "267073536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891562.056, "dur": 0.373, "args": { "External id": 12405,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "267073792"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891563.507, "dur": 1.965, "args": { "External id": 12406,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "267598080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891566.385, "dur": 0.359, "args": { "External id": 12407,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "268122368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891567.888, "dur": 0.283, "args": { "External id": 12408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "268646656"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891571.478, "dur": 0.400, "args": { "External id": 12409,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "269170944"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891572.889, "dur": 0.299, "args": { "External id": 12410,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "269171200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891574.282, "dur": 0.179, "args": { "External id": 12411,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "270612992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891577.242, "dur": 1.273, "args": { "External id": 12412,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "272054784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891579.495, "dur": 0.330, "args": { "External id": 12413,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "273496576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891580.988, "dur": 2.573, "args": { "External id": 12414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "273496832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891584.653, "dur": 0.393, "args": { "External id": 12415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "274021120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891586.020, "dur": 0.187, "args": { "External id": 12416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "274545408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891589.361, "dur": 0.300, "args": { "External id": 12417,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "275069696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891590.524, "dur": 0.300, "args": { "External id": 12418,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "275593984"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891592.252, "dur": 0.144, "args": { "External id": 12419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "275594240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891594.864, "dur": 0.851, "args": { "External id": 12420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "277036032"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891596.703, "dur": 0.172, "args": { "External id": 12421,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "278477824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891597.687, "dur": 2.179, "args": { "External id": 12422,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "279919616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891601.013, "dur": 0.309, "args": { "External id": 12423,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "279919872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891602.499, "dur": 0.329, "args": { "External id": 12424,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "280444160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891605.555, "dur": 0.364, "args": { "External id": 12425,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "280968448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891606.702, "dur": 0.422, "args": { "External id": 12426,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "281492736"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891608.378, "dur": 0.337, "args": { "External id": 12427,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "282017024"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891611.654, "dur": 0.901, "args": { "External id": 12428,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "282017280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891613.589, "dur": 0.184, "args": { "External id": 12429,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "283459072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891614.678, "dur": 2.179, "args": { "External id": 12430,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "284900864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891617.628, "dur": 0.151, "args": { "External id": 12431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "286342656"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649891618.528, "dur": 0.155, "args": { "External id": 12432,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "286342912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649891646.450, "dur": 56.360, "args": { "External id": 12433,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5928 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295649891774.302, "dur": 383.855, "args": { "External id": 12434,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[336611328], [42076416], [], [], []], "Ev Idx": 5929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649891813.691, "dur": 338.225, "args": { "External id": 12435,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 336611328, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[42076416], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5930, "In msg nelems": 42076416 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295649891824.271, "dur": 321.132, "args": { "External id": 12436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[42076416]], "Ev Idx": 5931 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649892184.014, "dur": 2.393, "args": { "External id": 12437,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5932, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out", "pid": 1336759, "tid": 1336759, "ts": 1295649892305.995, "dur": 9170.454, "args": { "External id": 12438,"Record function id": 0, "Ev Idx": 5933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892483.138, "dur": 6.915, "args": { "External id": 12439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892493.989, "dur": 0.995, "args": { "External id": 12440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892496.682, "dur": 0.887, "args": { "External id": 12441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892499.526, "dur": 1.923, "args": { "External id": 12442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892503.047, "dur": 0.731, "args": { "External id": 12443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892506.805, "dur": 0.777, "args": { "External id": 12444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892509.233, "dur": 0.887, "args": { "External id": 12445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892511.868, "dur": 1.760, "args": { "External id": 12446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892515.099, "dur": 0.572, "args": { "External id": 12447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892519.032, "dur": 0.651, "args": { "External id": 12448,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892521.287, "dur": 0.679, "args": { "External id": 12449,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892523.469, "dur": 1.500, "args": { "External id": 12450,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892526.601, "dur": 0.489, "args": { "External id": 12451,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892530.265, "dur": 0.508, "args": { "External id": 12452,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892532.068, "dur": 0.678, "args": { "External id": 12453,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892534.177, "dur": 1.262, "args": { "External id": 12454,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892537.004, "dur": 0.523, "args": { "External id": 12455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892540.354, "dur": 0.581, "args": { "External id": 12456,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892542.824, "dur": 0.512, "args": { "External id": 12457,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892544.945, "dur": 1.290, "args": { "External id": 12458,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892547.709, "dur": 0.691, "args": { "External id": 12459,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892551.252, "dur": 0.534, "args": { "External id": 12460,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892553.286, "dur": 0.460, "args": { "External id": 12461,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892554.982, "dur": 1.194, "args": { "External id": 12462,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892564.559, "dur": 0.686, "args": { "External id": 12463,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892568.379, "dur": 0.789, "args": { "External id": 12464,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892570.580, "dur": 0.582, "args": { "External id": 12465,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892572.667, "dur": 1.586, "args": { "External id": 12466,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892576.086, "dur": 0.563, "args": { "External id": 12467,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892579.722, "dur": 0.653, "args": { "External id": 12468,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892581.796, "dur": 0.694, "args": { "External id": 12469,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892583.731, "dur": 1.382, "args": { "External id": 12470,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892586.644, "dur": 0.575, "args": { "External id": 12471,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892591.072, "dur": 0.683, "args": { "External id": 12472,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892593.528, "dur": 0.791, "args": { "External id": 12473,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892595.659, "dur": 1.154, "args": { "External id": 12474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892598.575, "dur": 0.454, "args": { "External id": 12475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892602.073, "dur": 0.681, "args": { "External id": 12476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892604.636, "dur": 0.824, "args": { "External id": 12477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649892606.763, "dur": 1.465, "args": { "External id": 12478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5973 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649892633.305, "dur": 8791.606, "args": { "External id": 12479,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649892656.977, "dur": 8758.930, "args": { "External id": 12480,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649892685.265, "dur": 5.795, "args": { "External id": 12481,"Record function id": 0, "Concrete Inputs": ["[4290]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649892697.501, "dur": 8681.120, "args": { "External id": 12482,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], [], []], "Ev Idx": 5977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649892700.072, "dur": 8677.581, "args": { "External id": 12483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], []], "Ev Idx": 5978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649892705.149, "dur": 5.990, "args": { "External id": 12484,"Record function id": 0, "Concrete Inputs": ["[4290]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649892713.156, "dur": 8661.262, "args": { "External id": 12485,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[4290], [4290], []], "Ev Idx": 5980 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295649901730.503, "dur": 35.642, "args": { "External id": 12486,"Record function id": 0, "Ev Idx": 5981 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 0/0", "pid": 1336759, "tid": 1336759, "ts": 1295649901767.839, "dur": 202.015, "args": { "External id": 12487,"Record function id": 0, "Ev Idx": 5982 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649901809.227, "dur": 151.680, "args": { "External id": 12488,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "long int"], "Input Strides": [[2048, 1], [4096, 1]], "Input Dims": [[32000, 2048], [16, 4096]], "Ev Idx": 5983 } }, { "ph": "s", "id": 228, "pid": 1336759, "tid": 1336759, "ts": 1295649901809.227, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_0", "pid": 1336759, "tid": 1336759, "ts": 1295649901878.584, "dur": 48.099, "args": { "External id": 12489,"kernel_hash": "czer4rmela5ly34fgupsreshd4qo5eamimqpvrklpagr2lqevpwb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/ze/czer4rmela5ly34fgupsreshd4qo5eamimqpvrklpagr2lqevpwb.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096], [32000, 2048], [16, 4096, 2048], []], "Ev Idx": 5984 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295649902070.617, "dur": 56.935, "args": { "External id": 12490,"Record function id": 0, "Ev Idx": 5985 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.0)", "pid": 1336759, "tid": 1336759, "ts": 1295649902138.400, "dur": 6979.377, "args": { "External id": 12491,"Record function id": 0, "Ev Idx": 5986 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336759, "tid": 1336759, "ts": 1295649902146.135, "dur": 781.966, "args": { "External id": 12492,"Record function id": 0, "Ev Idx": 5987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649902218.233, "dur": 28.567, "args": { "External id": 12493,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649902262.446, "dur": 36.487, "args": { "External id": 12494,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902269.449, "dur": 2.609, "args": { "External id": 12495,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902274.434, "dur": 0.595, "args": { "External id": 12496,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902277.013, "dur": 1.923, "args": { "External id": 12497,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902280.352, "dur": 0.350, "args": { "External id": 12498,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902282.182, "dur": 0.148, "args": { "External id": 12499,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902285.638, "dur": 0.170, "args": { "External id": 12500,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902287.199, "dur": 0.161, "args": { "External id": 12501,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902288.605, "dur": 1.152, "args": { "External id": 12502,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902292.816, "dur": 0.480, "args": { "External id": 12503,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649902309.098, "dur": 38.554, "args": { "External id": 12504,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5999 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295649902381.077, "dur": 107.731, "args": { "External id": 12505,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649902392.336, "dur": 4.531, "args": { "External id": 12506,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295649902402.141, "dur": 10.921, "args": { "External id": 12507,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649902407.076, "dur": 5.574, "args": { "External id": 12508,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902411.022, "dur": 0.454, "args": { "External id": 12509,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649902419.649, "dur": 27.012, "args": { "External id": 12510,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902422.271, "dur": 0.379, "args": { "External id": 12511,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902424.160, "dur": 0.292, "args": { "External id": 12512,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902427.666, "dur": 0.323, "args": { "External id": 12513,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902429.120, "dur": 0.488, "args": { "External id": 12514,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902431.368, "dur": 2.823, "args": { "External id": 12515,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902435.737, "dur": 0.190, "args": { "External id": 12516,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902437.427, "dur": 0.144, "args": { "External id": 12517,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902440.570, "dur": 0.185, "args": { "External id": 12518,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649902442.440, "dur": 0.158, "args": { "External id": 12519,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649902458.042, "dur": 22.280, "args": { "External id": 12520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6015 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295649902541.367, "dur": 297.010, "args": { "External id": 12521,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6016 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649902570.481, "dur": 263.074, "args": { "External id": 12522,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6017, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295649902580.908, "dur": 246.982, "args": { "External id": 12523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6018 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649902860.636, "dur": 2.147, "args": { "External id": 12524,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6019, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336759, "tid": 1336759, "ts": 1295649902947.699, "dur": 5903.133, "args": { "External id": 12525,"Record function id": 0, "Ev Idx": 6020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903079.205, "dur": 6.758, "args": { "External id": 12526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903089.681, "dur": 1.063, "args": { "External id": 12527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903092.444, "dur": 0.841, "args": { "External id": 12528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903097.431, "dur": 1.705, "args": { "External id": 12529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903100.310, "dur": 0.915, "args": { "External id": 12530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903102.618, "dur": 0.514, "args": { "External id": 12531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903105.339, "dur": 0.694, "args": { "External id": 12532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903109.190, "dur": 1.886, "args": { "External id": 12533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903112.614, "dur": 0.660, "args": { "External id": 12534,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649903114.573, "dur": 0.605, "args": { "External id": 12535,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6030 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649903133.426, "dur": 5680.523, "args": { "External id": 12536,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649903148.779, "dur": 5658.519, "args": { "External id": 12537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649903172.197, "dur": 14.167, "args": { "External id": 12538,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649903191.607, "dur": 5583.591, "args": { "External id": 12539,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649903194.062, "dur": 5580.704, "args": { "External id": 12540,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649903199.692, "dur": 5.698, "args": { "External id": 12541,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649903207.184, "dur": 5564.928, "args": { "External id": 12542,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6037 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649909053.993, "dur": 37.305, "args": { "External id": 12543,"Sequence number": 246541, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6038 } }, { "ph": "s", "id": 227, "pid": 1336759, "tid": 1336759, "ts": 1295649909053.993, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295649909078.449, "dur": 8.057, "args": { "External id": 12544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649909081.752, "dur": 4.433, "args": { "External id": 12545,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6040 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295649909159.308, "dur": 123.612, "args": { "External id": 12546,"Record function id": 0, "Ev Idx": 6041 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295649909286.438, "dur": 1154.096, "args": { "External id": 12547,"Record function id": 0, "Ev Idx": 6042 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649909328.798, "dur": 1098.041, "args": { "External id": 12548,"Sequence number": 246542, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6043 } }, { "ph": "s", "id": 226, "pid": 1336759, "tid": 1336759, "ts": 1295649909328.798, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295649909401.890, "dur": 45.363, "args": { "External id": 12549,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649909459.253, "dur": 102.337, "args": { "External id": 12550,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649909572.577, "dur": 38.301, "args": { "External id": 12551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649909619.008, "dur": 30.732, "args": { "External id": 12552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6047 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649909674.081, "dur": 26.141, "args": { "External id": 12553,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6048 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649909718.489, "dur": 15.804, "args": { "External id": 12554,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6049 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295649909752.807, "dur": 124.460, "args": { "External id": 12555,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295649909802.685, "dur": 10.019, "args": { "External id": 12556,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649909807.533, "dur": 4.339, "args": { "External id": 12557,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649909815.583, "dur": 3.624, "args": { "External id": 12558,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649909820.724, "dur": 1.081, "args": { "External id": 12559,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649909824.323, "dur": 3.078, "args": { "External id": 12560,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649909886.997, "dur": 43.954, "args": { "External id": 12561,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6056 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295649909960.610, "dur": 118.560, "args": { "External id": 12562,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649910090.528, "dur": 45.982, "args": { "External id": 12563,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649910146.156, "dur": 33.854, "args": { "External id": 12564,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6059 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295649910203.669, "dur": 54.468, "args": { "External id": 12565,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649910266.151, "dur": 38.325, "args": { "External id": 12566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295649910333.921, "dur": 21.075, "args": { "External id": 12567,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6062 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.0)", "pid": 1336759, "tid": 1336759, "ts": 1295649910505.504, "dur": 77.283, "args": { "External id": 12568,"Record function id": 0, "Ev Idx": 6063 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295649910654.036, "dur": 45.014, "args": { "External id": 12569,"Record function id": 0, "Ev Idx": 6064 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.1)", "pid": 1336759, "tid": 1336759, "ts": 1295649910707.603, "dur": 18800.555, "args": { "External id": 12570,"Record function id": 0, "Ev Idx": 6065 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336759, "tid": 1336759, "ts": 1295649910714.986, "dur": 939.698, "args": { "External id": 12571,"Record function id": 0, "Ev Idx": 6066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649910790.778, "dur": 8.429, "args": { "External id": 12572,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649910812.678, "dur": 41.222, "args": { "External id": 12573,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910818.287, "dur": 4.332, "args": { "External id": 12574,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910825.331, "dur": 0.411, "args": { "External id": 12575,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910827.727, "dur": 0.457, "args": { "External id": 12576,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910832.393, "dur": 0.274, "args": { "External id": 12577,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910834.490, "dur": 1.403, "args": { "External id": 12578,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910837.966, "dur": 0.141, "args": { "External id": 12579,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910840.165, "dur": 0.270, "args": { "External id": 12580,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910842.970, "dur": 0.324, "args": { "External id": 12581,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910846.062, "dur": 2.302, "args": { "External id": 12582,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649910865.121, "dur": 39.968, "args": { "External id": 12583,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6078 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295649910937.092, "dur": 186.855, "args": { "External id": 12584,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649910947.960, "dur": 3.713, "args": { "External id": 12585,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295649910956.594, "dur": 10.934, "args": { "External id": 12586,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649910961.302, "dur": 5.777, "args": { "External id": 12587,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910965.370, "dur": 0.494, "args": { "External id": 12588,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649910975.172, "dur": 95.258, "args": { "External id": 12589,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910977.705, "dur": 0.324, "args": { "External id": 12590,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649910980.601, "dur": 65.026, "args": { "External id": 12591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911049.301, "dur": 2.278, "args": { "External id": 12592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911053.257, "dur": 0.458, "args": { "External id": 12593,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911055.227, "dur": 0.307, "args": { "External id": 12594,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911059.463, "dur": 0.296, "args": { "External id": 12595,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911060.972, "dur": 0.315, "args": { "External id": 12596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911062.936, "dur": 0.436, "args": { "External id": 12597,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911066.374, "dur": 0.278, "args": { "External id": 12598,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649911083.882, "dur": 30.976, "args": { "External id": 12599,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6094 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295649911177.384, "dur": 383.692, "args": { "External id": 12600,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6095 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649911217.719, "dur": 338.416, "args": { "External id": 12601,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6096, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295649911248.925, "dur": 300.941, "args": { "External id": 12602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6097 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649911584.805, "dur": 1.998, "args": { "External id": 12603,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6098, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336759, "tid": 1336759, "ts": 1295649911675.254, "dur": 17646.354, "args": { "External id": 12604,"Record function id": 0, "Ev Idx": 6099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911765.406, "dur": 6.477, "args": { "External id": 12605,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911775.253, "dur": 1.059, "args": { "External id": 12606,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911778.318, "dur": 0.816, "args": { "External id": 12607,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911781.019, "dur": 0.726, "args": { "External id": 12608,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911783.265, "dur": 0.601, "args": { "External id": 12609,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911786.905, "dur": 1.179, "args": { "External id": 12610,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911790.102, "dur": 0.717, "args": { "External id": 12611,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911792.505, "dur": 2.627, "args": { "External id": 12612,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911796.609, "dur": 0.582, "args": { "External id": 12613,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649911801.010, "dur": 0.505, "args": { "External id": 12614,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6109 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649911819.623, "dur": 17462.429, "args": { "External id": 12615,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649911834.657, "dur": 17440.222, "args": { "External id": 12616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649911856.497, "dur": 12.246, "args": { "External id": 12617,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649911871.353, "dur": 17355.094, "args": { "External id": 12618,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649911874.149, "dur": 17351.801, "args": { "External id": 12619,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649911879.499, "dur": 4.937, "args": { "External id": 12620,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649911886.013, "dur": 17336.716, "args": { "External id": 12621,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6116 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649929449.703, "dur": 34.620, "args": { "External id": 12622,"Sequence number": 246543, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6117 } }, { "ph": "s", "id": 225, "pid": 1336759, "tid": 1336759, "ts": 1295649929449.703, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295649929471.646, "dur": 8.046, "args": { "External id": 12623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649929475.045, "dur": 4.422, "args": { "External id": 12624,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6119 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295649929547.153, "dur": 76.970, "args": { "External id": 12625,"Record function id": 0, "Ev Idx": 6120 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295649929625.538, "dur": 1036.062, "args": { "External id": 12626,"Record function id": 0, "Ev Idx": 6121 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649929664.192, "dur": 984.340, "args": { "External id": 12627,"Sequence number": 246544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6122 } }, { "ph": "s", "id": 224, "pid": 1336759, "tid": 1336759, "ts": 1295649929664.192, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295649929731.765, "dur": 38.415, "args": { "External id": 12628,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649929782.968, "dur": 100.556, "args": { "External id": 12629,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649929890.720, "dur": 35.276, "args": { "External id": 12630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649929931.278, "dur": 30.771, "args": { "External id": 12631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6126 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649930026.756, "dur": 30.675, "args": { "External id": 12632,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6127 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649930075.078, "dur": 17.237, "args": { "External id": 12633,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6128 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295649930107.557, "dur": 144.269, "args": { "External id": 12634,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295649930156.410, "dur": 12.989, "args": { "External id": 12635,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649930161.040, "dur": 7.506, "args": { "External id": 12636,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649930172.267, "dur": 4.444, "args": { "External id": 12637,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649930177.928, "dur": 2.921, "args": { "External id": 12638,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649930183.019, "dur": 3.013, "args": { "External id": 12639,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649930264.533, "dur": 54.691, "args": { "External id": 12640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6135 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295649930350.301, "dur": 26.928, "args": { "External id": 12641,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649930385.662, "dur": 41.850, "args": { "External id": 12642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649930433.760, "dur": 34.560, "args": { "External id": 12643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6138 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295649930492.410, "dur": 21.574, "args": { "External id": 12644,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649930518.960, "dur": 33.046, "args": { "External id": 12645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6140 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295649930568.871, "dur": 19.093, "args": { "External id": 12646,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6141 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.1)", "pid": 1336759, "tid": 1336759, "ts": 1295649930723.280, "dur": 74.766, "args": { "External id": 12647,"Record function id": 0, "Ev Idx": 6142 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295649930871.786, "dur": 47.352, "args": { "External id": 12648,"Record function id": 0, "Ev Idx": 6143 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.2)", "pid": 1336759, "tid": 1336759, "ts": 1295649930927.922, "dur": 18692.352, "args": { "External id": 12649,"Record function id": 0, "Ev Idx": 6144 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336759, "tid": 1336759, "ts": 1295649930936.674, "dur": 890.962, "args": { "External id": 12650,"Record function id": 0, "Ev Idx": 6145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649931060.573, "dur": 9.051, "args": { "External id": 12651,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649931082.442, "dur": 33.172, "args": { "External id": 12652,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931087.747, "dur": 2.308, "args": { "External id": 12653,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931093.850, "dur": 0.250, "args": { "External id": 12654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931095.380, "dur": 0.367, "args": { "External id": 12655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931096.748, "dur": 0.366, "args": { "External id": 12656,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931100.098, "dur": 0.393, "args": { "External id": 12657,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931101.520, "dur": 0.488, "args": { "External id": 12658,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931103.076, "dur": 3.360, "args": { "External id": 12659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931107.351, "dur": 0.513, "args": { "External id": 12660,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931109.209, "dur": 0.332, "args": { "External id": 12661,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649931125.528, "dur": 41.449, "args": { "External id": 12662,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6157 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295649931199.722, "dur": 128.660, "args": { "External id": 12663,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649931211.361, "dur": 3.867, "args": { "External id": 12664,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295649931220.336, "dur": 30.156, "args": { "External id": 12665,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649931225.480, "dur": 24.548, "args": { "External id": 12666,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931247.316, "dur": 0.877, "args": { "External id": 12667,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649931258.364, "dur": 25.674, "args": { "External id": 12668,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931260.563, "dur": 2.273, "args": { "External id": 12669,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931263.950, "dur": 0.313, "args": { "External id": 12670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931265.525, "dur": 0.315, "args": { "External id": 12671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931268.833, "dur": 1.407, "args": { "External id": 12672,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931271.719, "dur": 0.311, "args": { "External id": 12673,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931272.941, "dur": 0.292, "args": { "External id": 12674,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931275.844, "dur": 0.246, "args": { "External id": 12675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931276.859, "dur": 0.301, "args": { "External id": 12676,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649931278.187, "dur": 2.078, "args": { "External id": 12677,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649931294.161, "dur": 26.300, "args": { "External id": 12678,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6173 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295649931382.796, "dur": 350.366, "args": { "External id": 12679,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6174 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649931411.857, "dur": 315.888, "args": { "External id": 12680,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6175, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295649931422.688, "dur": 299.619, "args": { "External id": 12681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6176 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649931757.330, "dur": 2.481, "args": { "External id": 12682,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6177, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336759, "tid": 1336759, "ts": 1295649931848.632, "dur": 17582.289, "args": { "External id": 12683,"Record function id": 0, "Ev Idx": 6178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931939.072, "dur": 6.179, "args": { "External id": 12684,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931948.998, "dur": 1.030, "args": { "External id": 12685,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931951.639, "dur": 1.630, "args": { "External id": 12686,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931954.966, "dur": 0.779, "args": { "External id": 12687,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931956.978, "dur": 0.681, "args": { "External id": 12688,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931959.159, "dur": 0.654, "args": { "External id": 12689,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931965.240, "dur": 0.810, "args": { "External id": 12690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931967.760, "dur": 1.703, "args": { "External id": 12691,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931970.873, "dur": 0.676, "args": { "External id": 12692,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649931973.202, "dur": 0.591, "args": { "External id": 12693,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649932031.929, "dur": 17360.070, "args": { "External id": 12694,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649932048.154, "dur": 17337.166, "args": { "External id": 12695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649932071.066, "dur": 14.257, "args": { "External id": 12696,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649932088.677, "dur": 17265.190, "args": { "External id": 12697,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649932091.352, "dur": 17261.965, "args": { "External id": 12698,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649932097.006, "dur": 6.891, "args": { "External id": 12699,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649932105.692, "dur": 17244.661, "args": { "External id": 12700,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6195 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649949562.773, "dur": 33.532, "args": { "External id": 12701,"Sequence number": 246545, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6196 } }, { "ph": "s", "id": 223, "pid": 1336759, "tid": 1336759, "ts": 1295649949562.773, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295649949584.387, "dur": 7.303, "args": { "External id": 12702,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649949587.245, "dur": 4.240, "args": { "External id": 12703,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6198 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295649949656.320, "dur": 75.186, "args": { "External id": 12704,"Record function id": 0, "Ev Idx": 6199 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295649949733.072, "dur": 1039.700, "args": { "External id": 12705,"Record function id": 0, "Ev Idx": 6200 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295649949772.966, "dur": 986.958, "args": { "External id": 12706,"Sequence number": 246546, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6201 } }, { "ph": "s", "id": 222, "pid": 1336759, "tid": 1336759, "ts": 1295649949772.966, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295649949837.937, "dur": 42.023, "args": { "External id": 12707,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649949891.852, "dur": 137.020, "args": { "External id": 12708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950042.740, "dur": 43.121, "args": { "External id": 12709,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950094.194, "dur": 30.141, "args": { "External id": 12710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6205 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649950150.297, "dur": 25.123, "args": { "External id": 12711,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6206 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295649950191.415, "dur": 14.823, "args": { "External id": 12712,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6207 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295649950224.738, "dur": 144.401, "args": { "External id": 12713,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295649950293.345, "dur": 11.554, "args": { "External id": 12714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649950298.351, "dur": 5.611, "args": { "External id": 12715,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649950307.429, "dur": 4.299, "args": { "External id": 12716,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649950313.048, "dur": 0.975, "args": { "External id": 12717,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649950316.238, "dur": 3.298, "args": { "External id": 12718,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950380.209, "dur": 48.248, "args": { "External id": 12719,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6214 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295649950457.028, "dur": 26.109, "args": { "External id": 12720,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950490.814, "dur": 39.635, "args": { "External id": 12721,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950537.855, "dur": 34.522, "args": { "External id": 12722,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6217 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295649950592.965, "dur": 23.398, "args": { "External id": 12723,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295649950621.914, "dur": 33.337, "args": { "External id": 12724,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295649950677.520, "dur": 16.097, "args": { "External id": 12725,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6220 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.2)", "pid": 1336759, "tid": 1336759, "ts": 1295649950834.759, "dur": 73.220, "args": { "External id": 12726,"Record function id": 0, "Ev Idx": 6221 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295649950980.567, "dur": 94.890, "args": { "External id": 12727,"Record function id": 0, "Ev Idx": 6222 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.3)", "pid": 1336759, "tid": 1336759, "ts": 1295649951085.364, "dur": 85341.431, "args": { "External id": 12728,"Record function id": 0, "Ev Idx": 6223 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336759, "tid": 1336759, "ts": 1295649951093.697, "dur": 947.664, "args": { "External id": 12729,"Record function id": 0, "Ev Idx": 6224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649951170.341, "dur": 8.895, "args": { "External id": 12730,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649951192.852, "dur": 53.489, "args": { "External id": 12731,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951198.433, "dur": 2.463, "args": { "External id": 12732,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951205.508, "dur": 0.267, "args": { "External id": 12733,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951207.077, "dur": 0.354, "args": { "External id": 12734,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951212.784, "dur": 0.336, "args": { "External id": 12735,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951215.905, "dur": 0.573, "args": { "External id": 12736,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951217.391, "dur": 0.446, "args": { "External id": 12737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951218.777, "dur": 2.670, "args": { "External id": 12738,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951222.611, "dur": 0.173, "args": { "External id": 12739,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951223.913, "dur": 0.345, "args": { "External id": 12740,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649951258.227, "dur": 43.077, "args": { "External id": 12741,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6236 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295649951336.533, "dur": 117.577, "args": { "External id": 12742,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649951348.835, "dur": 4.755, "args": { "External id": 12743,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295649951358.476, "dur": 10.359, "args": { "External id": 12744,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295649951363.005, "dur": 5.437, "args": { "External id": 12745,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951366.411, "dur": 0.676, "args": { "External id": 12746,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295649951375.912, "dur": 28.820, "args": { "External id": 12747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951377.698, "dur": 2.246, "args": { "External id": 12748,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951381.585, "dur": 0.277, "args": { "External id": 12749,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951383.128, "dur": 0.300, "args": { "External id": 12750,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951387.392, "dur": 1.242, "args": { "External id": 12751,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951389.608, "dur": 0.304, "args": { "External id": 12752,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951391.258, "dur": 0.389, "args": { "External id": 12753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951394.811, "dur": 0.563, "args": { "External id": 12754,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951396.734, "dur": 0.313, "args": { "External id": 12755,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649951398.527, "dur": 2.242, "args": { "External id": 12756,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649951422.957, "dur": 23.437, "args": { "External id": 12757,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6252 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295649951507.059, "dur": 396.481, "args": { "External id": 12758,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6253 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649951534.241, "dur": 363.897, "args": { "External id": 12759,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6254, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295649951547.914, "dur": 344.568, "args": { "External id": 12760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6255 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295649951929.149, "dur": 2.357, "args": { "External id": 12761,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6256, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336759, "tid": 1336759, "ts": 1295649952065.668, "dur": 84142.801, "args": { "External id": 12762,"Record function id": 0, "Ev Idx": 6257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952164.795, "dur": 6.709, "args": { "External id": 12763,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952175.074, "dur": 0.906, "args": { "External id": 12764,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952177.829, "dur": 1.889, "args": { "External id": 12765,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952181.616, "dur": 0.940, "args": { "External id": 12766,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952183.933, "dur": 0.877, "args": { "External id": 12767,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952186.196, "dur": 0.701, "args": { "External id": 12768,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952190.257, "dur": 0.848, "args": { "External id": 12769,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952192.460, "dur": 1.827, "args": { "External id": 12770,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952196.069, "dur": 0.492, "args": { "External id": 12771,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295649952197.772, "dur": 0.790, "args": { "External id": 12772,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6267 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649952218.800, "dur": 83943.723, "args": { "External id": 12773,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649952253.205, "dur": 83901.457, "args": { "External id": 12774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295649952276.578, "dur": 14.072, "args": { "External id": 12775,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295649952293.921, "dur": 83826.518, "args": { "External id": 12776,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295649952296.493, "dur": 83823.187, "args": { "External id": 12777,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295649952302.022, "dur": 5.802, "args": { "External id": 12778,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295649952309.535, "dur": 83807.040, "args": { "External id": 12779,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6274 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650036357.730, "dur": 43.065, "args": { "External id": 12780,"Sequence number": 246547, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6275 } }, { "ph": "s", "id": 221, "pid": 1336759, "tid": 1336759, "ts": 1295650036357.730, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650036387.177, "dur": 8.708, "args": { "External id": 12781,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650036390.560, "dur": 5.026, "args": { "External id": 12782,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6277 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650036465.075, "dur": 73.920, "args": { "External id": 12783,"Record function id": 0, "Ev Idx": 6278 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650036540.801, "dur": 1080.676, "args": { "External id": 12784,"Record function id": 0, "Ev Idx": 6279 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650036580.326, "dur": 1027.469, "args": { "External id": 12785,"Sequence number": 246548, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6280 } }, { "ph": "s", "id": 220, "pid": 1336759, "tid": 1336759, "ts": 1295650036580.326, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650036644.262, "dur": 42.847, "args": { "External id": 12786,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650036698.166, "dur": 101.503, "args": { "External id": 12787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650036810.510, "dur": 38.017, "args": { "External id": 12788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650036855.047, "dur": 31.564, "args": { "External id": 12789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6284 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650036914.309, "dur": 23.601, "args": { "External id": 12790,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6285 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650036953.101, "dur": 12.965, "args": { "External id": 12791,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6286 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650037021.715, "dur": 133.765, "args": { "External id": 12792,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650037073.756, "dur": 12.703, "args": { "External id": 12793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650037078.858, "dur": 6.629, "args": { "External id": 12794,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650037089.245, "dur": 5.115, "args": { "External id": 12795,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650037095.939, "dur": 1.268, "args": { "External id": 12796,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650037101.874, "dur": 3.876, "args": { "External id": 12797,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650037166.551, "dur": 51.735, "args": { "External id": 12798,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6293 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650037266.694, "dur": 28.833, "args": { "External id": 12799,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650037305.661, "dur": 43.950, "args": { "External id": 12800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650037381.273, "dur": 35.016, "args": { "External id": 12801,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650037442.533, "dur": 23.336, "args": { "External id": 12802,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650037471.570, "dur": 34.762, "args": { "External id": 12803,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650037524.251, "dur": 19.388, "args": { "External id": 12804,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6299 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.3)", "pid": 1336759, "tid": 1336759, "ts": 1295650037684.724, "dur": 73.118, "args": { "External id": 12805,"Record function id": 0, "Ev Idx": 6300 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650037832.129, "dur": 45.751, "args": { "External id": 12806,"Record function id": 0, "Ev Idx": 6301 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.4)", "pid": 1336759, "tid": 1336759, "ts": 1295650037886.827, "dur": 19651.820, "args": { "External id": 12807,"Record function id": 0, "Ev Idx": 6302 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336759, "tid": 1336759, "ts": 1295650037895.613, "dur": 901.685, "args": { "External id": 12808,"Record function id": 0, "Ev Idx": 6303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650037969.948, "dur": 7.855, "args": { "External id": 12809,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650038033.483, "dur": 33.448, "args": { "External id": 12810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038038.731, "dur": 2.496, "args": { "External id": 12811,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038045.610, "dur": 0.356, "args": { "External id": 12812,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038047.153, "dur": 0.417, "args": { "External id": 12813,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038048.793, "dur": 0.550, "args": { "External id": 12814,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038051.871, "dur": 0.180, "args": { "External id": 12815,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038053.464, "dur": 0.712, "args": { "External id": 12816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038055.643, "dur": 2.836, "args": { "External id": 12817,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038059.662, "dur": 0.383, "args": { "External id": 12818,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038061.209, "dur": 0.290, "args": { "External id": 12819,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650038077.035, "dur": 45.684, "args": { "External id": 12820,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6315 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650038155.864, "dur": 129.146, "args": { "External id": 12821,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650038166.846, "dur": 5.627, "args": { "External id": 12822,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650038177.476, "dur": 10.116, "args": { "External id": 12823,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650038182.333, "dur": 4.861, "args": { "External id": 12824,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038185.576, "dur": 0.462, "args": { "External id": 12825,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650038194.024, "dur": 28.435, "args": { "External id": 12826,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038196.313, "dur": 2.470, "args": { "External id": 12827,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038199.957, "dur": 0.464, "args": { "External id": 12828,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038201.908, "dur": 0.521, "args": { "External id": 12829,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038205.552, "dur": 1.486, "args": { "External id": 12830,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038208.321, "dur": 0.478, "args": { "External id": 12831,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038210.081, "dur": 0.360, "args": { "External id": 12832,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038213.213, "dur": 0.319, "args": { "External id": 12833,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038214.752, "dur": 0.402, "args": { "External id": 12834,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650038216.156, "dur": 2.251, "args": { "External id": 12835,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650038249.910, "dur": 26.794, "args": { "External id": 12836,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6331 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650038340.050, "dur": 363.170, "args": { "External id": 12837,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6332 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650038369.420, "dur": 328.858, "args": { "External id": 12838,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6333, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650038381.174, "dur": 311.605, "args": { "External id": 12839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6334 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650038727.529, "dur": 2.256, "args": { "External id": 12840,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6335, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336759, "tid": 1336759, "ts": 1295650038818.111, "dur": 18535.533, "args": { "External id": 12841,"Record function id": 0, "Ev Idx": 6336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038911.367, "dur": 6.214, "args": { "External id": 12842,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038921.098, "dur": 0.662, "args": { "External id": 12843,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038923.580, "dur": 2.149, "args": { "External id": 12844,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038927.334, "dur": 0.756, "args": { "External id": 12845,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038929.607, "dur": 0.840, "args": { "External id": 12846,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038931.764, "dur": 0.587, "args": { "External id": 12847,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038935.629, "dur": 0.867, "args": { "External id": 12848,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038938.163, "dur": 1.688, "args": { "External id": 12849,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038941.004, "dur": 0.565, "args": { "External id": 12850,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650038942.949, "dur": 0.630, "args": { "External id": 12851,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6346 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650038963.109, "dur": 18351.155, "args": { "External id": 12852,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650038977.942, "dur": 18329.556, "args": { "External id": 12853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650039040.181, "dur": 15.367, "args": { "External id": 12854,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650039059.068, "dur": 18217.433, "args": { "External id": 12855,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650039061.508, "dur": 18214.431, "args": { "External id": 12856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650039067.627, "dur": 6.537, "args": { "External id": 12857,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650039075.962, "dur": 18197.129, "args": { "External id": 12858,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6353 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650057480.504, "dur": 33.412, "args": { "External id": 12859,"Sequence number": 246549, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6354 } }, { "ph": "s", "id": 219, "pid": 1336759, "tid": 1336759, "ts": 1295650057480.504, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650057501.419, "dur": 7.724, "args": { "External id": 12860,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650057504.544, "dur": 4.413, "args": { "External id": 12861,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6356 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650057575.434, "dur": 78.117, "args": { "External id": 12862,"Record function id": 0, "Ev Idx": 6357 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650057655.107, "dur": 1062.035, "args": { "External id": 12863,"Record function id": 0, "Ev Idx": 6358 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650057691.128, "dur": 1013.278, "args": { "External id": 12864,"Sequence number": 246550, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6359 } }, { "ph": "s", "id": 218, "pid": 1336759, "tid": 1336759, "ts": 1295650057691.128, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650057757.497, "dur": 39.222, "args": { "External id": 12865,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650057808.486, "dur": 104.495, "args": { "External id": 12866,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650057922.409, "dur": 37.909, "args": { "External id": 12867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650057968.585, "dur": 75.048, "args": { "External id": 12868,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6363 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650058073.714, "dur": 28.103, "args": { "External id": 12869,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6364 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650058118.495, "dur": 14.236, "args": { "External id": 12870,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6365 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650058150.063, "dur": 148.684, "args": { "External id": 12871,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650058198.794, "dur": 11.250, "args": { "External id": 12872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650058203.444, "dur": 5.790, "args": { "External id": 12873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650058212.692, "dur": 4.824, "args": { "External id": 12874,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650058218.868, "dur": 1.349, "args": { "External id": 12875,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650058222.591, "dur": 3.971, "args": { "External id": 12876,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650058310.865, "dur": 51.850, "args": { "External id": 12877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6372 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650058394.414, "dur": 27.036, "args": { "External id": 12878,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650058430.062, "dur": 41.303, "args": { "External id": 12879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650058479.979, "dur": 34.173, "args": { "External id": 12880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6375 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650058535.497, "dur": 25.396, "args": { "External id": 12881,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650058566.056, "dur": 33.193, "args": { "External id": 12882,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6377 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650058620.347, "dur": 16.974, "args": { "External id": 12883,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6378 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.4)", "pid": 1336759, "tid": 1336759, "ts": 1295650058779.488, "dur": 72.093, "args": { "External id": 12884,"Record function id": 0, "Ev Idx": 6379 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650058925.173, "dur": 46.172, "args": { "External id": 12885,"Record function id": 0, "Ev Idx": 6380 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.5)", "pid": 1336759, "tid": 1336759, "ts": 1295650058979.860, "dur": 19054.137, "args": { "External id": 12886,"Record function id": 0, "Ev Idx": 6381 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336759, "tid": 1336759, "ts": 1295650059030.476, "dur": 828.954, "args": { "External id": 12887,"Record function id": 0, "Ev Idx": 6382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650059109.547, "dur": 9.580, "args": { "External id": 12888,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650059132.325, "dur": 33.210, "args": { "External id": 12889,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059137.601, "dur": 2.095, "args": { "External id": 12890,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059143.420, "dur": 0.283, "args": { "External id": 12891,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059145.064, "dur": 0.356, "args": { "External id": 12892,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059146.497, "dur": 0.457, "args": { "External id": 12893,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059149.898, "dur": 0.488, "args": { "External id": 12894,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059151.521, "dur": 0.408, "args": { "External id": 12895,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059153.212, "dur": 2.981, "args": { "External id": 12896,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059157.688, "dur": 0.195, "args": { "External id": 12897,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059159.073, "dur": 0.291, "args": { "External id": 12898,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650059175.850, "dur": 42.591, "args": { "External id": 12899,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6394 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650059268.947, "dur": 109.458, "args": { "External id": 12900,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650059279.549, "dur": 5.588, "args": { "External id": 12901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650059290.115, "dur": 10.334, "args": { "External id": 12902,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650059294.638, "dur": 5.366, "args": { "External id": 12903,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059297.908, "dur": 0.643, "args": { "External id": 12904,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650059307.002, "dur": 26.436, "args": { "External id": 12905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059309.175, "dur": 2.431, "args": { "External id": 12906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059313.188, "dur": 0.447, "args": { "External id": 12907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059314.956, "dur": 0.167, "args": { "External id": 12908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059318.312, "dur": 1.585, "args": { "External id": 12909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059321.074, "dur": 0.483, "args": { "External id": 12910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059322.508, "dur": 0.300, "args": { "External id": 12911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059325.505, "dur": 0.174, "args": { "External id": 12912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059326.954, "dur": 0.180, "args": { "External id": 12913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650059328.103, "dur": 1.754, "args": { "External id": 12914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650059344.879, "dur": 25.480, "args": { "External id": 12915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6410 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650059432.435, "dur": 339.113, "args": { "External id": 12916,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6411 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650059461.640, "dur": 305.333, "args": { "External id": 12917,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6412, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650059473.318, "dur": 287.007, "args": { "External id": 12918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6413 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650059792.828, "dur": 2.220, "args": { "External id": 12919,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6414, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336759, "tid": 1336759, "ts": 1295650059878.612, "dur": 17937.534, "args": { "External id": 12920,"Record function id": 0, "Ev Idx": 6415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650059969.557, "dur": 5.390, "args": { "External id": 12921,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650059978.174, "dur": 0.779, "args": { "External id": 12922,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650059980.558, "dur": 43.132, "args": { "External id": 12923,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060028.271, "dur": 0.881, "args": { "External id": 12924,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060030.402, "dur": 0.716, "args": { "External id": 12925,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060032.325, "dur": 0.631, "args": { "External id": 12926,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060036.387, "dur": 0.723, "args": { "External id": 12927,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060038.830, "dur": 1.761, "args": { "External id": 12928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060041.924, "dur": 0.489, "args": { "External id": 12929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650060044.031, "dur": 0.591, "args": { "External id": 12930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6425 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650060064.720, "dur": 17712.558, "args": { "External id": 12931,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650060084.866, "dur": 17685.926, "args": { "External id": 12932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650060105.233, "dur": 15.826, "args": { "External id": 12933,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650060124.128, "dur": 17615.924, "args": { "External id": 12934,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650060126.429, "dur": 17612.777, "args": { "External id": 12935,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650060132.060, "dur": 6.015, "args": { "External id": 12936,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650060140.004, "dur": 17596.203, "args": { "External id": 12937,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6432 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650077945.136, "dur": 33.263, "args": { "External id": 12938,"Sequence number": 246551, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6433 } }, { "ph": "s", "id": 217, "pid": 1336759, "tid": 1336759, "ts": 1295650077945.136, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650077966.422, "dur": 7.522, "args": { "External id": 12939,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650077969.316, "dur": 4.395, "args": { "External id": 12940,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6435 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650078073.163, "dur": 73.898, "args": { "External id": 12941,"Record function id": 0, "Ev Idx": 6436 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650078148.896, "dur": 1049.735, "args": { "External id": 12942,"Record function id": 0, "Ev Idx": 6437 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650078190.577, "dur": 995.240, "args": { "External id": 12943,"Sequence number": 246552, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6438 } }, { "ph": "s", "id": 216, "pid": 1336759, "tid": 1336759, "ts": 1295650078190.577, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650078276.411, "dur": 46.273, "args": { "External id": 12944,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078337.166, "dur": 103.121, "args": { "External id": 12945,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078449.663, "dur": 37.454, "args": { "External id": 12946,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078495.134, "dur": 30.822, "args": { "External id": 12947,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6442 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650078549.381, "dur": 25.371, "args": { "External id": 12948,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6443 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650078591.263, "dur": 13.646, "args": { "External id": 12949,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6444 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650078626.532, "dur": 123.165, "args": { "External id": 12950,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650078673.943, "dur": 11.274, "args": { "External id": 12951,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650078678.712, "dur": 5.638, "args": { "External id": 12952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650078688.154, "dur": 5.168, "args": { "External id": 12953,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650078694.833, "dur": 1.293, "args": { "External id": 12954,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650078698.249, "dur": 3.964, "args": { "External id": 12955,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078759.344, "dur": 42.774, "args": { "External id": 12956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6451 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650078832.006, "dur": 26.817, "args": { "External id": 12957,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078867.124, "dur": 39.419, "args": { "External id": 12958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650078914.794, "dur": 33.765, "args": { "External id": 12959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6454 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650078969.151, "dur": 63.540, "args": { "External id": 12960,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650079040.098, "dur": 38.251, "args": { "External id": 12961,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6456 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650079102.156, "dur": 18.887, "args": { "External id": 12962,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6457 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.5)", "pid": 1336759, "tid": 1336759, "ts": 1295650079280.352, "dur": 73.170, "args": { "External id": 12963,"Record function id": 0, "Ev Idx": 6458 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650079428.928, "dur": 46.527, "args": { "External id": 12964,"Record function id": 0, "Ev Idx": 6459 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.6)", "pid": 1336759, "tid": 1336759, "ts": 1295650079484.000, "dur": 18988.106, "args": { "External id": 12965,"Record function id": 0, "Ev Idx": 6460 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336759, "tid": 1336759, "ts": 1295650079492.198, "dur": 799.625, "args": { "External id": 12966,"Record function id": 0, "Ev Idx": 6461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650079568.543, "dur": 8.327, "args": { "External id": 12967,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650079589.622, "dur": 33.084, "args": { "External id": 12968,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079595.372, "dur": 2.424, "args": { "External id": 12969,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079601.756, "dur": 0.291, "args": { "External id": 12970,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079603.508, "dur": 0.362, "args": { "External id": 12971,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079605.061, "dur": 0.434, "args": { "External id": 12972,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079608.421, "dur": 0.321, "args": { "External id": 12973,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079609.805, "dur": 0.376, "args": { "External id": 12974,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079611.670, "dur": 2.908, "args": { "External id": 12975,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079615.370, "dur": 0.320, "args": { "External id": 12976,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079617.005, "dur": 0.158, "args": { "External id": 12977,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650079632.771, "dur": 41.930, "args": { "External id": 12978,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6473 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650079706.358, "dur": 99.029, "args": { "External id": 12979,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650079716.685, "dur": 4.136, "args": { "External id": 12980,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650079725.328, "dur": 9.917, "args": { "External id": 12981,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650079729.831, "dur": 4.981, "args": { "External id": 12982,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079733.295, "dur": 0.433, "args": { "External id": 12983,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650079741.583, "dur": 24.865, "args": { "External id": 12984,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079743.115, "dur": 2.121, "args": { "External id": 12985,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079746.193, "dur": 0.445, "args": { "External id": 12986,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079747.997, "dur": 0.289, "args": { "External id": 12987,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079751.233, "dur": 1.214, "args": { "External id": 12988,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079753.795, "dur": 0.185, "args": { "External id": 12989,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079755.005, "dur": 0.339, "args": { "External id": 12990,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079757.839, "dur": 0.178, "args": { "External id": 12991,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079759.181, "dur": 0.288, "args": { "External id": 12992,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650079760.900, "dur": 2.017, "args": { "External id": 12993,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650079775.245, "dur": 22.940, "args": { "External id": 12994,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6489 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650079856.546, "dur": 320.019, "args": { "External id": 12995,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6490 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650079884.023, "dur": 287.084, "args": { "External id": 12996,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6491, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650079895.273, "dur": 270.201, "args": { "External id": 12997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6492 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650080201.310, "dur": 2.517, "args": { "External id": 12998,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6493, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336759, "tid": 1336759, "ts": 1295650080314.155, "dur": 17967.861, "args": { "External id": 12999,"Record function id": 0, "Ev Idx": 6494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080411.846, "dur": 6.728, "args": { "External id": 13000,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080422.158, "dur": 0.968, "args": { "External id": 13001,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080424.612, "dur": 2.022, "args": { "External id": 13002,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080428.262, "dur": 0.784, "args": { "External id": 13003,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080430.277, "dur": 0.765, "args": { "External id": 13004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080432.358, "dur": 0.563, "args": { "External id": 13005,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080436.107, "dur": 0.732, "args": { "External id": 13006,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080438.254, "dur": 1.638, "args": { "External id": 13007,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080441.326, "dur": 0.589, "args": { "External id": 13008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650080443.221, "dur": 0.495, "args": { "External id": 13009,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6504 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650080463.573, "dur": 17780.650, "args": { "External id": 13010,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650080479.025, "dur": 17747.524, "args": { "External id": 13011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650080501.634, "dur": 12.979, "args": { "External id": 13012,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650080517.887, "dur": 17677.984, "args": { "External id": 13013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650080520.374, "dur": 17674.891, "args": { "External id": 13014,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650080525.805, "dur": 5.280, "args": { "External id": 13015,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650080532.642, "dur": 17659.722, "args": { "External id": 13016,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6511 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650098412.792, "dur": 34.123, "args": { "External id": 13017,"Sequence number": 246553, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6512 } }, { "ph": "s", "id": 215, "pid": 1336759, "tid": 1336759, "ts": 1295650098412.792, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650098434.087, "dur": 7.658, "args": { "External id": 13018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650098437.117, "dur": 4.402, "args": { "External id": 13019,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6514 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650098509.663, "dur": 74.856, "args": { "External id": 13020,"Record function id": 0, "Ev Idx": 6515 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650098585.896, "dur": 1051.866, "args": { "External id": 13021,"Record function id": 0, "Ev Idx": 6516 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650098624.664, "dur": 999.955, "args": { "External id": 13022,"Sequence number": 246554, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6517 } }, { "ph": "s", "id": 214, "pid": 1336759, "tid": 1336759, "ts": 1295650098624.664, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650098691.986, "dur": 41.529, "args": { "External id": 13023,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650098745.183, "dur": 101.040, "args": { "External id": 13024,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650098854.809, "dur": 35.938, "args": { "External id": 13025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650098899.403, "dur": 32.202, "args": { "External id": 13026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6521 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650098955.418, "dur": 24.117, "args": { "External id": 13027,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6522 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650099040.087, "dur": 17.883, "args": { "External id": 13028,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6523 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650099076.621, "dur": 125.931, "args": { "External id": 13029,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650099124.335, "dur": 11.633, "args": { "External id": 13030,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650099128.929, "dur": 6.250, "args": { "External id": 13031,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650099138.550, "dur": 5.061, "args": { "External id": 13032,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650099144.837, "dur": 1.201, "args": { "External id": 13033,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650099148.390, "dur": 4.333, "args": { "External id": 13034,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650099212.577, "dur": 65.418, "args": { "External id": 13035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6530 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650099312.430, "dur": 27.149, "args": { "External id": 13036,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650099348.429, "dur": 42.619, "args": { "External id": 13037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650099399.870, "dur": 34.091, "args": { "External id": 13038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650099456.243, "dur": 25.142, "args": { "External id": 13039,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650099486.780, "dur": 33.889, "args": { "External id": 13040,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650099540.330, "dur": 16.635, "args": { "External id": 13041,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.6)", "pid": 1336759, "tid": 1336759, "ts": 1295650099700.531, "dur": 70.703, "args": { "External id": 13042,"Record function id": 0, "Ev Idx": 6537 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650099844.972, "dur": 46.534, "args": { "External id": 13043,"Record function id": 0, "Ev Idx": 6538 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.7)", "pid": 1336759, "tid": 1336759, "ts": 1295650099900.397, "dur": 18823.698, "args": { "External id": 13044,"Record function id": 0, "Ev Idx": 6539 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336759, "tid": 1336759, "ts": 1295650099908.704, "dur": 866.945, "args": { "External id": 13045,"Record function id": 0, "Ev Idx": 6540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650100021.663, "dur": 9.493, "args": { "External id": 13046,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650100046.530, "dur": 33.068, "args": { "External id": 13047,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100051.962, "dur": 2.236, "args": { "External id": 13048,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100058.379, "dur": 0.364, "args": { "External id": 13049,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100059.806, "dur": 0.341, "args": { "External id": 13050,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100061.861, "dur": 0.280, "args": { "External id": 13051,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100064.414, "dur": 0.223, "args": { "External id": 13052,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100066.090, "dur": 0.376, "args": { "External id": 13053,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100067.531, "dur": 2.885, "args": { "External id": 13054,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100071.848, "dur": 0.430, "args": { "External id": 13055,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100073.376, "dur": 0.328, "args": { "External id": 13056,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650100089.895, "dur": 42.219, "args": { "External id": 13057,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6552 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650100164.982, "dur": 122.324, "args": { "External id": 13058,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650100175.762, "dur": 3.469, "args": { "External id": 13059,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650100184.086, "dur": 10.444, "args": { "External id": 13060,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650100188.837, "dur": 5.274, "args": { "External id": 13061,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100192.329, "dur": 0.541, "args": { "External id": 13062,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650100200.609, "dur": 25.725, "args": { "External id": 13063,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100202.320, "dur": 2.613, "args": { "External id": 13064,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100206.700, "dur": 0.252, "args": { "External id": 13065,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100207.897, "dur": 0.426, "args": { "External id": 13066,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100211.689, "dur": 1.074, "args": { "External id": 13067,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100213.718, "dur": 0.159, "args": { "External id": 13068,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100215.149, "dur": 0.172, "args": { "External id": 13069,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100217.879, "dur": 0.157, "args": { "External id": 13070,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100219.342, "dur": 0.186, "args": { "External id": 13071,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650100220.495, "dur": 2.151, "args": { "External id": 13072,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650100254.225, "dur": 25.359, "args": { "External id": 13073,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6568 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650100341.051, "dur": 346.530, "args": { "External id": 13074,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6569 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650100374.391, "dur": 308.537, "args": { "External id": 13075,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6570, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650100386.303, "dur": 291.798, "args": { "External id": 13076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6571 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650100710.476, "dur": 2.128, "args": { "External id": 13077,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6572, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336759, "tid": 1336759, "ts": 1295650100795.673, "dur": 17741.928, "args": { "External id": 13078,"Record function id": 0, "Ev Idx": 6573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100892.598, "dur": 6.200, "args": { "External id": 13079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100901.927, "dur": 1.035, "args": { "External id": 13080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100904.775, "dur": 2.122, "args": { "External id": 13081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100909.992, "dur": 0.783, "args": { "External id": 13082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100912.067, "dur": 0.730, "args": { "External id": 13083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100914.054, "dur": 0.756, "args": { "External id": 13084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100916.594, "dur": 0.783, "args": { "External id": 13085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100920.253, "dur": 1.470, "args": { "External id": 13086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100923.170, "dur": 0.458, "args": { "External id": 13087,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650100924.783, "dur": 0.639, "args": { "External id": 13088,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6583 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650100944.549, "dur": 17552.288, "args": { "External id": 13089,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650100958.911, "dur": 17531.020, "args": { "External id": 13090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650100978.617, "dur": 55.533, "args": { "External id": 13091,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650101040.291, "dur": 17418.345, "args": { "External id": 13092,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650101042.663, "dur": 17415.390, "args": { "External id": 13093,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650101047.958, "dur": 5.777, "args": { "External id": 13094,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650101055.179, "dur": 17399.767, "args": { "External id": 13095,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6590 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650118663.249, "dur": 36.680, "args": { "External id": 13096,"Sequence number": 246555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6591 } }, { "ph": "s", "id": 213, "pid": 1336759, "tid": 1336759, "ts": 1295650118663.249, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650118687.184, "dur": 7.855, "args": { "External id": 13097,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650118690.346, "dur": 4.473, "args": { "External id": 13098,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6593 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650118762.768, "dur": 76.123, "args": { "External id": 13099,"Record function id": 0, "Ev Idx": 6594 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650118840.439, "dur": 1045.374, "args": { "External id": 13100,"Record function id": 0, "Ev Idx": 6595 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650118881.453, "dur": 991.803, "args": { "External id": 13101,"Sequence number": 246556, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6596 } }, { "ph": "s", "id": 212, "pid": 1336759, "tid": 1336759, "ts": 1295650118881.453, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650118948.932, "dur": 73.555, "args": { "External id": 13102,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119038.396, "dur": 103.915, "args": { "External id": 13103,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119152.231, "dur": 37.493, "args": { "External id": 13104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119198.430, "dur": 45.082, "args": { "External id": 13105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6600 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650119274.177, "dur": 26.156, "args": { "External id": 13106,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6601 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650119317.069, "dur": 14.161, "args": { "External id": 13107,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6602 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650119349.552, "dur": 129.062, "args": { "External id": 13108,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650119397.629, "dur": 11.491, "args": { "External id": 13109,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650119402.562, "dur": 5.670, "args": { "External id": 13110,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650119411.851, "dur": 5.116, "args": { "External id": 13111,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650119423.273, "dur": 1.273, "args": { "External id": 13112,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650119426.957, "dur": 3.959, "args": { "External id": 13113,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119489.856, "dur": 48.368, "args": { "External id": 13114,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6609 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650119569.473, "dur": 24.431, "args": { "External id": 13115,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119601.992, "dur": 40.873, "args": { "External id": 13116,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119651.210, "dur": 34.159, "args": { "External id": 13117,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6612 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650119706.488, "dur": 23.856, "args": { "External id": 13118,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650119736.039, "dur": 32.759, "args": { "External id": 13119,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650119790.916, "dur": 17.033, "args": { "External id": 13120,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6615 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.7)", "pid": 1336759, "tid": 1336759, "ts": 1295650119949.338, "dur": 114.917, "args": { "External id": 13121,"Record function id": 0, "Ev Idx": 6616 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650120143.124, "dur": 47.706, "args": { "External id": 13122,"Record function id": 0, "Ev Idx": 6617 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.8)", "pid": 1336759, "tid": 1336759, "ts": 1295650120199.067, "dur": 18719.925, "args": { "External id": 13123,"Record function id": 0, "Ev Idx": 6618 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336759, "tid": 1336759, "ts": 1295650120208.235, "dur": 861.136, "args": { "External id": 13124,"Record function id": 0, "Ev Idx": 6619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650120299.918, "dur": 9.188, "args": { "External id": 13125,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650120322.713, "dur": 33.279, "args": { "External id": 13126,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120328.232, "dur": 2.368, "args": { "External id": 13127,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120334.821, "dur": 0.507, "args": { "External id": 13128,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120336.541, "dur": 0.275, "args": { "External id": 13129,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120338.165, "dur": 0.359, "args": { "External id": 13130,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120341.434, "dur": 0.342, "args": { "External id": 13131,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120343.106, "dur": 0.343, "args": { "External id": 13132,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120344.772, "dur": 2.946, "args": { "External id": 13133,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120349.086, "dur": 0.186, "args": { "External id": 13134,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120350.402, "dur": 0.189, "args": { "External id": 13135,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650120367.243, "dur": 43.432, "args": { "External id": 13136,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6631 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650120443.528, "dur": 102.394, "args": { "External id": 13137,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650120453.623, "dur": 4.232, "args": { "External id": 13138,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650120462.774, "dur": 10.621, "args": { "External id": 13139,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650120467.589, "dur": 5.376, "args": { "External id": 13140,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120471.201, "dur": 0.520, "args": { "External id": 13141,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650120479.405, "dur": 25.477, "args": { "External id": 13142,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120481.333, "dur": 2.535, "args": { "External id": 13143,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120485.188, "dur": 0.440, "args": { "External id": 13144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120486.955, "dur": 0.263, "args": { "External id": 13145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120490.354, "dur": 1.397, "args": { "External id": 13146,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120492.884, "dur": 0.166, "args": { "External id": 13147,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120494.303, "dur": 0.159, "args": { "External id": 13148,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120496.725, "dur": 0.267, "args": { "External id": 13149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120498.028, "dur": 0.160, "args": { "External id": 13150,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650120499.217, "dur": 1.784, "args": { "External id": 13151,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650120514.785, "dur": 23.138, "args": { "External id": 13152,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6647 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650120596.211, "dur": 338.329, "args": { "External id": 13153,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6648 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650120626.079, "dur": 303.469, "args": { "External id": 13154,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6649, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650120637.416, "dur": 287.473, "args": { "External id": 13155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6650 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650120957.074, "dur": 2.158, "args": { "External id": 13156,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6651, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336759, "tid": 1336759, "ts": 1295650121091.466, "dur": 17644.336, "args": { "External id": 13157,"Record function id": 0, "Ev Idx": 6652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121186.998, "dur": 7.013, "args": { "External id": 13158,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121197.078, "dur": 0.972, "args": { "External id": 13159,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121199.727, "dur": 2.083, "args": { "External id": 13160,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121203.703, "dur": 0.550, "args": { "External id": 13161,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121205.583, "dur": 0.913, "args": { "External id": 13162,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121207.716, "dur": 0.594, "args": { "External id": 13163,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121211.143, "dur": 0.693, "args": { "External id": 13164,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121213.562, "dur": 1.822, "args": { "External id": 13165,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121216.876, "dur": 0.542, "args": { "External id": 13166,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650121218.897, "dur": 0.587, "args": { "External id": 13167,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6662 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650121264.211, "dur": 17432.546, "args": { "External id": 13168,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650121281.721, "dur": 17408.585, "args": { "External id": 13169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650121302.376, "dur": 13.501, "args": { "External id": 13170,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650121318.957, "dur": 17340.331, "args": { "External id": 13171,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650121321.243, "dur": 17337.331, "args": { "External id": 13172,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650121326.715, "dur": 6.122, "args": { "External id": 13173,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650121334.642, "dur": 17320.858, "args": { "External id": 13174,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6669 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650138862.937, "dur": 32.607, "args": { "External id": 13175,"Sequence number": 246557, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6670 } }, { "ph": "s", "id": 211, "pid": 1336759, "tid": 1336759, "ts": 1295650138862.937, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650138883.378, "dur": 7.389, "args": { "External id": 13176,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650138886.438, "dur": 4.176, "args": { "External id": 13177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6672 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650138955.842, "dur": 108.758, "args": { "External id": 13178,"Record function id": 0, "Ev Idx": 6673 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650139067.698, "dur": 1034.560, "args": { "External id": 13179,"Record function id": 0, "Ev Idx": 6674 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650139107.548, "dur": 980.852, "args": { "External id": 13180,"Sequence number": 246558, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6675 } }, { "ph": "s", "id": 210, "pid": 1336759, "tid": 1336759, "ts": 1295650139107.548, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650139174.810, "dur": 41.869, "args": { "External id": 13181,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139245.754, "dur": 104.325, "args": { "External id": 13182,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139361.309, "dur": 37.384, "args": { "External id": 13183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139407.126, "dur": 30.575, "args": { "External id": 13184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6679 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650139463.300, "dur": 25.114, "args": { "External id": 13185,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6680 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650139506.054, "dur": 14.201, "args": { "External id": 13186,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6681 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650139538.529, "dur": 123.574, "args": { "External id": 13187,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650139585.175, "dur": 11.461, "args": { "External id": 13188,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650139589.911, "dur": 5.927, "args": { "External id": 13189,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650139599.143, "dur": 5.746, "args": { "External id": 13190,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650139606.232, "dur": 1.282, "args": { "External id": 13191,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650139609.851, "dur": 3.889, "args": { "External id": 13192,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139672.656, "dur": 45.472, "args": { "External id": 13193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6688 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650139746.323, "dur": 25.848, "args": { "External id": 13194,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139779.903, "dur": 39.337, "args": { "External id": 13195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139827.537, "dur": 33.545, "args": { "External id": 13196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6691 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650139883.281, "dur": 23.918, "args": { "External id": 13197,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650139912.627, "dur": 33.405, "args": { "External id": 13198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6693 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650139964.796, "dur": 52.119, "args": { "External id": 13199,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6694 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.8)", "pid": 1336759, "tid": 1336759, "ts": 1295650140166.449, "dur": 90.729, "args": { "External id": 13200,"Record function id": 0, "Ev Idx": 6695 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650140333.315, "dur": 49.194, "args": { "External id": 13201,"Record function id": 0, "Ev Idx": 6696 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.9)", "pid": 1336759, "tid": 1336759, "ts": 1295650140390.974, "dur": 18686.369, "args": { "External id": 13202,"Record function id": 0, "Ev Idx": 6697 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336759, "tid": 1336759, "ts": 1295650140400.124, "dur": 930.153, "args": { "External id": 13203,"Record function id": 0, "Ev Idx": 6698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650140479.983, "dur": 9.109, "args": { "External id": 13204,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650140502.039, "dur": 32.720, "args": { "External id": 13205,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140507.353, "dur": 2.400, "args": { "External id": 13206,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140513.759, "dur": 0.400, "args": { "External id": 13207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140515.719, "dur": 0.331, "args": { "External id": 13208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140517.203, "dur": 0.251, "args": { "External id": 13209,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140520.399, "dur": 0.190, "args": { "External id": 13210,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140521.557, "dur": 0.216, "args": { "External id": 13211,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140523.332, "dur": 2.948, "args": { "External id": 13212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140527.425, "dur": 0.260, "args": { "External id": 13213,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140528.925, "dur": 0.375, "args": { "External id": 13214,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650140546.164, "dur": 42.663, "args": { "External id": 13215,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6710 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650140619.417, "dur": 111.385, "args": { "External id": 13216,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650140629.586, "dur": 4.013, "args": { "External id": 13217,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650140638.222, "dur": 9.704, "args": { "External id": 13218,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650140642.618, "dur": 4.892, "args": { "External id": 13219,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140645.971, "dur": 0.480, "args": { "External id": 13220,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650140654.044, "dur": 28.027, "args": { "External id": 13221,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140655.744, "dur": 1.992, "args": { "External id": 13222,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140662.518, "dur": 0.345, "args": { "External id": 13223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140664.102, "dur": 0.243, "args": { "External id": 13224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140666.995, "dur": 1.270, "args": { "External id": 13225,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140669.337, "dur": 0.185, "args": { "External id": 13226,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140670.571, "dur": 1.994, "args": { "External id": 13227,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140673.694, "dur": 0.170, "args": { "External id": 13228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140674.990, "dur": 0.155, "args": { "External id": 13229,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650140678.376, "dur": 0.204, "args": { "External id": 13230,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650140699.501, "dur": 23.479, "args": { "External id": 13231,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6726 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650140784.645, "dur": 424.023, "args": { "External id": 13232,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6727 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650140813.569, "dur": 389.215, "args": { "External id": 13233,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6728, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650140825.650, "dur": 371.583, "args": { "External id": 13234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6729 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650141249.927, "dur": 3.557, "args": { "External id": 13235,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6730, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336759, "tid": 1336759, "ts": 1295650141351.522, "dur": 17507.860, "args": { "External id": 13236,"Record function id": 0, "Ev Idx": 6731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141448.886, "dur": 6.887, "args": { "External id": 13237,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141459.005, "dur": 1.100, "args": { "External id": 13238,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141461.686, "dur": 2.659, "args": { "External id": 13239,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141466.009, "dur": 1.012, "args": { "External id": 13240,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141468.275, "dur": 0.774, "args": { "External id": 13241,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141470.231, "dur": 0.647, "args": { "External id": 13242,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141474.342, "dur": 0.603, "args": { "External id": 13243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141476.504, "dur": 1.714, "args": { "External id": 13244,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141479.592, "dur": 0.912, "args": { "External id": 13245,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650141482.198, "dur": 0.524, "args": { "External id": 13246,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650141502.349, "dur": 17318.326, "args": { "External id": 13247,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650141517.998, "dur": 17295.862, "args": { "External id": 13248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650141539.835, "dur": 14.714, "args": { "External id": 13249,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650141557.318, "dur": 17225.577, "args": { "External id": 13250,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650141559.468, "dur": 17222.765, "args": { "External id": 13251,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650141565.308, "dur": 5.471, "args": { "External id": 13252,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650141572.558, "dur": 17206.579, "args": { "External id": 13253,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6748 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650159013.263, "dur": 37.008, "args": { "External id": 13254,"Sequence number": 246559, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6749 } }, { "ph": "s", "id": 209, "pid": 1336759, "tid": 1336759, "ts": 1295650159013.263, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650159037.119, "dur": 7.891, "args": { "External id": 13255,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650159040.403, "dur": 4.274, "args": { "External id": 13256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6751 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650159115.664, "dur": 77.290, "args": { "External id": 13257,"Record function id": 0, "Ev Idx": 6752 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650159194.711, "dur": 1046.367, "args": { "External id": 13258,"Record function id": 0, "Ev Idx": 6753 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650159248.793, "dur": 965.533, "args": { "External id": 13259,"Sequence number": 246560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6754 } }, { "ph": "s", "id": 208, "pid": 1336759, "tid": 1336759, "ts": 1295650159248.793, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650159316.950, "dur": 43.839, "args": { "External id": 13260,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159373.434, "dur": 103.332, "args": { "External id": 13261,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159486.142, "dur": 37.436, "args": { "External id": 13262,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159531.453, "dur": 32.024, "args": { "External id": 13263,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6758 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650159586.241, "dur": 23.825, "args": { "External id": 13264,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6759 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650159625.828, "dur": 13.280, "args": { "External id": 13265,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6760 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650159656.150, "dur": 119.560, "args": { "External id": 13266,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650159701.755, "dur": 11.232, "args": { "External id": 13267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650159706.864, "dur": 5.346, "args": { "External id": 13268,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650159715.599, "dur": 5.054, "args": { "External id": 13269,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650159721.827, "dur": 1.336, "args": { "External id": 13270,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650159725.434, "dur": 3.947, "args": { "External id": 13271,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159785.887, "dur": 43.064, "args": { "External id": 13272,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6767 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650159857.339, "dur": 25.896, "args": { "External id": 13273,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159897.349, "dur": 40.507, "args": { "External id": 13274,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650159946.429, "dur": 33.386, "args": { "External id": 13275,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6770 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650160043.089, "dur": 26.910, "args": { "External id": 13276,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650160076.636, "dur": 37.989, "args": { "External id": 13277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650160134.498, "dur": 17.520, "args": { "External id": 13278,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6773 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.9)", "pid": 1336759, "tid": 1336759, "ts": 1295650160307.671, "dur": 71.812, "args": { "External id": 13279,"Record function id": 0, "Ev Idx": 6774 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650160451.131, "dur": 45.916, "args": { "External id": 13280,"Record function id": 0, "Ev Idx": 6775 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.10)", "pid": 1336759, "tid": 1336759, "ts": 1295650160505.126, "dur": 18420.307, "args": { "External id": 13281,"Record function id": 0, "Ev Idx": 6776 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336759, "tid": 1336759, "ts": 1295650160513.752, "dur": 961.807, "args": { "External id": 13282,"Record function id": 0, "Ev Idx": 6777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650160591.083, "dur": 8.368, "args": { "External id": 13283,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650160612.247, "dur": 33.218, "args": { "External id": 13284,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160617.808, "dur": 2.355, "args": { "External id": 13285,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160624.003, "dur": 0.275, "args": { "External id": 13286,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160625.553, "dur": 0.368, "args": { "External id": 13287,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160627.142, "dur": 0.357, "args": { "External id": 13288,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160630.934, "dur": 0.318, "args": { "External id": 13289,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160632.315, "dur": 0.264, "args": { "External id": 13290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160633.812, "dur": 3.597, "args": { "External id": 13291,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160638.416, "dur": 0.180, "args": { "External id": 13292,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160639.897, "dur": 0.286, "args": { "External id": 13293,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650160655.012, "dur": 41.222, "args": { "External id": 13294,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6789 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650160728.076, "dur": 101.096, "args": { "External id": 13295,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650160738.361, "dur": 4.637, "args": { "External id": 13296,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650160747.901, "dur": 9.544, "args": { "External id": 13297,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650160752.094, "dur": 4.914, "args": { "External id": 13298,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160755.515, "dur": 0.399, "args": { "External id": 13299,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650160764.121, "dur": 25.321, "args": { "External id": 13300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160765.861, "dur": 1.974, "args": { "External id": 13301,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160768.757, "dur": 0.392, "args": { "External id": 13302,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160770.571, "dur": 0.316, "args": { "External id": 13303,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160773.838, "dur": 1.416, "args": { "External id": 13304,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160776.498, "dur": 0.292, "args": { "External id": 13305,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160777.818, "dur": 0.281, "args": { "External id": 13306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160781.179, "dur": 0.217, "args": { "External id": 13307,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160782.167, "dur": 0.426, "args": { "External id": 13308,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650160783.973, "dur": 1.945, "args": { "External id": 13309,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650160798.664, "dur": 23.152, "args": { "External id": 13310,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6805 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650160879.558, "dur": 491.036, "args": { "External id": 13311,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6806 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650160906.979, "dur": 457.423, "args": { "External id": 13312,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6807, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650160944.737, "dur": 413.224, "args": { "External id": 13313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6808 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650161397.005, "dur": 2.760, "args": { "External id": 13314,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6809, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336759, "tid": 1336759, "ts": 1295650161496.850, "dur": 17241.709, "args": { "External id": 13315,"Record function id": 0, "Ev Idx": 6810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161594.178, "dur": 6.749, "args": { "External id": 13316,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161604.495, "dur": 0.825, "args": { "External id": 13317,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161607.109, "dur": 1.952, "args": { "External id": 13318,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161610.678, "dur": 0.711, "args": { "External id": 13319,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161612.672, "dur": 0.654, "args": { "External id": 13320,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161614.576, "dur": 0.624, "args": { "External id": 13321,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161618.376, "dur": 0.852, "args": { "External id": 13322,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161620.831, "dur": 1.752, "args": { "External id": 13323,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161624.067, "dur": 0.704, "args": { "External id": 13324,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650161626.372, "dur": 0.627, "args": { "External id": 13325,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6820 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650161646.691, "dur": 17054.079, "args": { "External id": 13326,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650161663.017, "dur": 17031.111, "args": { "External id": 13327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650161683.748, "dur": 13.387, "args": { "External id": 13328,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650161700.188, "dur": 16962.175, "args": { "External id": 13329,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650161702.481, "dur": 16959.138, "args": { "External id": 13330,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650161708.101, "dur": 5.530, "args": { "External id": 13331,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650161715.407, "dur": 16943.396, "args": { "External id": 13332,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6827 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650178868.153, "dur": 32.860, "args": { "External id": 13333,"Sequence number": 246561, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6828 } }, { "ph": "s", "id": 207, "pid": 1336759, "tid": 1336759, "ts": 1295650178868.153, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650178888.733, "dur": 7.317, "args": { "External id": 13334,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650178891.786, "dur": 4.056, "args": { "External id": 13335,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6830 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650178963.000, "dur": 106.240, "args": { "External id": 13336,"Record function id": 0, "Ev Idx": 6831 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650179072.336, "dur": 1032.452, "args": { "External id": 13337,"Record function id": 0, "Ev Idx": 6832 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650179112.904, "dur": 978.990, "args": { "External id": 13338,"Sequence number": 246562, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6833 } }, { "ph": "s", "id": 206, "pid": 1336759, "tid": 1336759, "ts": 1295650179112.904, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650179180.379, "dur": 42.113, "args": { "External id": 13339,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179250.226, "dur": 105.185, "args": { "External id": 13340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179365.616, "dur": 36.884, "args": { "External id": 13341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179410.387, "dur": 30.432, "args": { "External id": 13342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6837 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650179466.013, "dur": 24.523, "args": { "External id": 13343,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6838 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650179507.872, "dur": 14.576, "args": { "External id": 13344,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6839 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650179540.133, "dur": 123.039, "args": { "External id": 13345,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650179587.729, "dur": 11.090, "args": { "External id": 13346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650179592.375, "dur": 5.655, "args": { "External id": 13347,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650179601.468, "dur": 5.567, "args": { "External id": 13348,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650179608.603, "dur": 1.346, "args": { "External id": 13349,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650179612.542, "dur": 3.496, "args": { "External id": 13350,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179673.959, "dur": 43.018, "args": { "External id": 13351,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6846 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650179746.720, "dur": 27.763, "args": { "External id": 13352,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179782.198, "dur": 40.030, "args": { "External id": 13353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179830.344, "dur": 33.657, "args": { "External id": 13354,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650179883.971, "dur": 24.698, "args": { "External id": 13355,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650179913.946, "dur": 33.600, "args": { "External id": 13356,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650179969.041, "dur": 53.612, "args": { "External id": 13357,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6852 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.10)", "pid": 1336759, "tid": 1336759, "ts": 1295650180167.560, "dur": 88.311, "args": { "External id": 13358,"Record function id": 0, "Ev Idx": 6853 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650180332.509, "dur": 46.859, "args": { "External id": 13359,"Record function id": 0, "Ev Idx": 6854 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.11)", "pid": 1336759, "tid": 1336759, "ts": 1295650180387.608, "dur": 18586.299, "args": { "External id": 13360,"Record function id": 0, "Ev Idx": 6855 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336759, "tid": 1336759, "ts": 1295650180396.546, "dur": 889.689, "args": { "External id": 13361,"Record function id": 0, "Ev Idx": 6856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650180473.562, "dur": 8.798, "args": { "External id": 13362,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650180495.424, "dur": 33.190, "args": { "External id": 13363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180500.552, "dur": 2.175, "args": { "External id": 13364,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180507.356, "dur": 0.543, "args": { "External id": 13365,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180509.370, "dur": 0.367, "args": { "External id": 13366,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180511.282, "dur": 0.256, "args": { "External id": 13367,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180513.998, "dur": 0.299, "args": { "External id": 13368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180516.128, "dur": 0.163, "args": { "External id": 13369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180517.356, "dur": 2.841, "args": { "External id": 13370,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180521.658, "dur": 0.333, "args": { "External id": 13371,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180522.875, "dur": 0.293, "args": { "External id": 13372,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650180541.983, "dur": 43.174, "args": { "External id": 13373,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6868 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650180616.568, "dur": 103.159, "args": { "External id": 13374,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650180626.756, "dur": 5.281, "args": { "External id": 13375,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650180636.658, "dur": 10.446, "args": { "External id": 13376,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650180641.259, "dur": 5.472, "args": { "External id": 13377,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180644.751, "dur": 0.493, "args": { "External id": 13378,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650180653.233, "dur": 24.972, "args": { "External id": 13379,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180655.112, "dur": 0.511, "args": { "External id": 13380,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180657.307, "dur": 2.213, "args": { "External id": 13381,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180660.973, "dur": 0.355, "args": { "External id": 13382,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180662.764, "dur": 1.169, "args": { "External id": 13383,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180666.700, "dur": 0.200, "args": { "External id": 13384,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180668.378, "dur": 0.293, "args": { "External id": 13385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180669.640, "dur": 0.400, "args": { "External id": 13386,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180673.089, "dur": 0.251, "args": { "External id": 13387,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650180674.440, "dur": 0.318, "args": { "External id": 13388,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650180688.639, "dur": 23.665, "args": { "External id": 13389,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6884 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650180770.232, "dur": 401.784, "args": { "External id": 13390,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6885 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650180799.008, "dur": 367.495, "args": { "External id": 13391,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6886, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650180810.901, "dur": 350.300, "args": { "External id": 13392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6887 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650181196.817, "dur": 2.419, "args": { "External id": 13393,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6888, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336759, "tid": 1336759, "ts": 1295650181308.155, "dur": 17478.640, "args": { "External id": 13394,"Record function id": 0, "Ev Idx": 6889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181404.293, "dur": 6.574, "args": { "External id": 13395,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181414.255, "dur": 1.205, "args": { "External id": 13396,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181417.345, "dur": 1.968, "args": { "External id": 13397,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181420.936, "dur": 0.683, "args": { "External id": 13398,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181422.955, "dur": 1.028, "args": { "External id": 13399,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181425.103, "dur": 0.590, "args": { "External id": 13400,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181429.098, "dur": 0.742, "args": { "External id": 13401,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181431.148, "dur": 1.788, "args": { "External id": 13402,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181434.875, "dur": 0.775, "args": { "External id": 13403,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650181436.941, "dur": 0.625, "args": { "External id": 13404,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6899 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650181457.052, "dur": 17290.637, "args": { "External id": 13405,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650181472.961, "dur": 17268.094, "args": { "External id": 13406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650181494.451, "dur": 13.130, "args": { "External id": 13407,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650181510.599, "dur": 17198.791, "args": { "External id": 13408,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650181513.138, "dur": 17195.613, "args": { "External id": 13409,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650181518.652, "dur": 5.443, "args": { "External id": 13410,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650181525.959, "dur": 17179.731, "args": { "External id": 13411,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6906 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650198913.591, "dur": 36.641, "args": { "External id": 13412,"Sequence number": 246563, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6907 } }, { "ph": "s", "id": 205, "pid": 1336759, "tid": 1336759, "ts": 1295650198913.591, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650198937.356, "dur": 7.681, "args": { "External id": 13413,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650198940.653, "dur": 4.147, "args": { "External id": 13414,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6909 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650199039.922, "dur": 78.951, "args": { "External id": 13415,"Record function id": 0, "Ev Idx": 6910 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650199121.039, "dur": 1041.276, "args": { "External id": 13416,"Record function id": 0, "Ev Idx": 6911 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650199162.261, "dur": 987.155, "args": { "External id": 13417,"Sequence number": 246564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6912 } }, { "ph": "s", "id": 204, "pid": 1336759, "tid": 1336759, "ts": 1295650199162.261, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650199242.280, "dur": 42.700, "args": { "External id": 13418,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199300.183, "dur": 103.639, "args": { "External id": 13419,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199413.610, "dur": 38.166, "args": { "External id": 13420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199460.193, "dur": 30.285, "args": { "External id": 13421,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6916 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650199515.765, "dur": 22.947, "args": { "External id": 13422,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6917 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650199555.427, "dur": 13.714, "args": { "External id": 13423,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6918 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650199587.122, "dur": 122.715, "args": { "External id": 13424,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650199633.822, "dur": 10.620, "args": { "External id": 13425,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650199638.393, "dur": 5.274, "args": { "External id": 13426,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650199647.168, "dur": 5.375, "args": { "External id": 13427,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650199653.723, "dur": 1.305, "args": { "External id": 13428,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650199657.773, "dur": 3.683, "args": { "External id": 13429,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199720.357, "dur": 45.179, "args": { "External id": 13430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6925 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650199796.348, "dur": 26.668, "args": { "External id": 13431,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199831.391, "dur": 39.927, "args": { "External id": 13432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199879.620, "dur": 34.266, "args": { "External id": 13433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6928 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650199935.499, "dur": 23.750, "args": { "External id": 13434,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650199964.581, "dur": 75.170, "args": { "External id": 13435,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6930 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650200064.097, "dur": 18.575, "args": { "External id": 13436,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6931 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.11)", "pid": 1336759, "tid": 1336759, "ts": 1295650200225.661, "dur": 92.333, "args": { "External id": 13437,"Record function id": 0, "Ev Idx": 6932 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650200393.672, "dur": 48.227, "args": { "External id": 13438,"Record function id": 0, "Ev Idx": 6933 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.12)", "pid": 1336759, "tid": 1336759, "ts": 1295650200450.480, "dur": 18219.892, "args": { "External id": 13439,"Record function id": 0, "Ev Idx": 6934 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336759, "tid": 1336759, "ts": 1295650200458.631, "dur": 884.782, "args": { "External id": 13440,"Record function id": 0, "Ev Idx": 6935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650200535.618, "dur": 8.293, "args": { "External id": 13441,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650200559.399, "dur": 33.294, "args": { "External id": 13442,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200564.781, "dur": 2.407, "args": { "External id": 13443,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200571.111, "dur": 0.578, "args": { "External id": 13444,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200573.113, "dur": 0.412, "args": { "External id": 13445,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200574.677, "dur": 2.163, "args": { "External id": 13446,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200578.171, "dur": 0.308, "args": { "External id": 13447,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200579.622, "dur": 0.416, "args": { "External id": 13448,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200583.089, "dur": 1.316, "args": { "External id": 13449,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200585.704, "dur": 0.396, "args": { "External id": 13450,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200586.949, "dur": 0.185, "args": { "External id": 13451,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650200603.534, "dur": 42.652, "args": { "External id": 13452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6947 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650200677.870, "dur": 99.537, "args": { "External id": 13453,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650200687.945, "dur": 4.082, "args": { "External id": 13454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650200696.907, "dur": 11.154, "args": { "External id": 13455,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650200701.360, "dur": 6.268, "args": { "External id": 13456,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200704.522, "dur": 1.992, "args": { "External id": 13457,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650200714.410, "dur": 24.314, "args": { "External id": 13458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200716.028, "dur": 0.331, "args": { "External id": 13459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200717.728, "dur": 0.658, "args": { "External id": 13460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200719.510, "dur": 0.315, "args": { "External id": 13461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200723.357, "dur": 1.135, "args": { "External id": 13462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200725.825, "dur": 0.157, "args": { "External id": 13463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200727.174, "dur": 2.091, "args": { "External id": 13464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200730.247, "dur": 0.375, "args": { "External id": 13465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200731.740, "dur": 0.183, "args": { "External id": 13466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650200734.950, "dur": 0.166, "args": { "External id": 13467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650200747.281, "dur": 22.929, "args": { "External id": 13468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6963 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650200828.177, "dur": 413.637, "args": { "External id": 13469,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6964 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650200858.474, "dur": 362.987, "args": { "External id": 13470,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6965, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650200868.195, "dur": 347.285, "args": { "External id": 13471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6966 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650201270.833, "dur": 2.997, "args": { "External id": 13472,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6967, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336759, "tid": 1336759, "ts": 1295650201363.761, "dur": 17113.902, "args": { "External id": 13473,"Record function id": 0, "Ev Idx": 6968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201459.036, "dur": 6.364, "args": { "External id": 13474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201468.921, "dur": 1.111, "args": { "External id": 13475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201471.611, "dur": 1.927, "args": { "External id": 13476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201475.208, "dur": 0.672, "args": { "External id": 13477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201477.200, "dur": 0.760, "args": { "External id": 13478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201479.206, "dur": 0.824, "args": { "External id": 13479,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201483.046, "dur": 0.629, "args": { "External id": 13480,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201485.376, "dur": 1.652, "args": { "External id": 13481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201488.538, "dur": 0.860, "args": { "External id": 13482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650201491.168, "dur": 0.609, "args": { "External id": 13483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6978 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650201510.572, "dur": 16924.443, "args": { "External id": 13484,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650201525.783, "dur": 16902.739, "args": { "External id": 13485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650201547.452, "dur": 14.623, "args": { "External id": 13486,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650201565.079, "dur": 16830.272, "args": { "External id": 13487,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650201567.863, "dur": 16826.817, "args": { "External id": 13488,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650201573.910, "dur": 5.184, "args": { "External id": 13489,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650201580.820, "dur": 16811.069, "args": { "External id": 13490,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6985 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650218610.579, "dur": 34.492, "args": { "External id": 13491,"Sequence number": 246565, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6986 } }, { "ph": "s", "id": 203, "pid": 1336759, "tid": 1336759, "ts": 1295650218610.579, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650218632.062, "dur": 8.061, "args": { "External id": 13492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650218635.395, "dur": 4.461, "args": { "External id": 13493,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6988 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650218707.578, "dur": 73.414, "args": { "External id": 13494,"Record function id": 0, "Ev Idx": 6989 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650218782.544, "dur": 1033.045, "args": { "External id": 13495,"Record function id": 0, "Ev Idx": 6990 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650218821.936, "dur": 981.033, "args": { "External id": 13496,"Sequence number": 246566, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6991 } }, { "ph": "s", "id": 202, "pid": 1336759, "tid": 1336759, "ts": 1295650218821.936, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650218884.829, "dur": 39.565, "args": { "External id": 13497,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650218936.753, "dur": 131.980, "args": { "External id": 13498,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219083.294, "dur": 40.662, "args": { "External id": 13499,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219132.301, "dur": 30.722, "args": { "External id": 13500,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6995 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650219188.950, "dur": 23.354, "args": { "External id": 13501,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6996 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650219242.891, "dur": 16.739, "args": { "External id": 13502,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6997 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650219279.149, "dur": 126.825, "args": { "External id": 13503,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650219329.191, "dur": 11.435, "args": { "External id": 13504,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650219333.887, "dur": 6.090, "args": { "External id": 13505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650219343.277, "dur": 5.146, "args": { "External id": 13506,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650219349.767, "dur": 1.379, "args": { "External id": 13507,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650219353.343, "dur": 4.103, "args": { "External id": 13508,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219416.681, "dur": 48.055, "args": { "External id": 13509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7004 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650219495.244, "dur": 24.810, "args": { "External id": 13510,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219528.735, "dur": 40.254, "args": { "External id": 13511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219576.793, "dur": 33.971, "args": { "External id": 13512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7007 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650219638.862, "dur": 25.222, "args": { "External id": 13513,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650219671.709, "dur": 33.713, "args": { "External id": 13514,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7009 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650219722.894, "dur": 17.135, "args": { "External id": 13515,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7010 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.12)", "pid": 1336759, "tid": 1336759, "ts": 1295650219877.275, "dur": 71.004, "args": { "External id": 13516,"Record function id": 0, "Ev Idx": 7011 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650220064.666, "dur": 48.254, "args": { "External id": 13517,"Record function id": 0, "Ev Idx": 7012 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.13)", "pid": 1336759, "tid": 1336759, "ts": 1295650220121.940, "dur": 18420.359, "args": { "External id": 13518,"Record function id": 0, "Ev Idx": 7013 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336759, "tid": 1336759, "ts": 1295650220130.185, "dur": 822.328, "args": { "External id": 13519,"Record function id": 0, "Ev Idx": 7014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650220206.802, "dur": 9.406, "args": { "External id": 13520,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650220245.414, "dur": 33.323, "args": { "External id": 13521,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220251.012, "dur": 2.376, "args": { "External id": 13522,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220257.475, "dur": 0.483, "args": { "External id": 13523,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220259.430, "dur": 0.383, "args": { "External id": 13524,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220260.908, "dur": 0.355, "args": { "External id": 13525,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220263.857, "dur": 0.404, "args": { "External id": 13526,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220265.206, "dur": 0.372, "args": { "External id": 13527,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220266.792, "dur": 3.117, "args": { "External id": 13528,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220270.703, "dur": 0.342, "args": { "External id": 13529,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220272.683, "dur": 0.298, "args": { "External id": 13530,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650220289.375, "dur": 43.575, "args": { "External id": 13531,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7026 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650220366.423, "dur": 104.062, "args": { "External id": 13532,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650220377.359, "dur": 4.421, "args": { "External id": 13533,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650220386.802, "dur": 9.952, "args": { "External id": 13534,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650220391.331, "dur": 5.028, "args": { "External id": 13535,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220394.743, "dur": 0.435, "args": { "External id": 13536,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650220404.304, "dur": 24.477, "args": { "External id": 13537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220405.895, "dur": 2.034, "args": { "External id": 13538,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220409.009, "dur": 0.315, "args": { "External id": 13539,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220410.685, "dur": 0.404, "args": { "External id": 13540,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220413.843, "dur": 1.218, "args": { "External id": 13541,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220416.160, "dur": 0.322, "args": { "External id": 13542,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220417.333, "dur": 0.144, "args": { "External id": 13543,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220420.187, "dur": 0.293, "args": { "External id": 13544,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220421.631, "dur": 0.292, "args": { "External id": 13545,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650220423.094, "dur": 2.202, "args": { "External id": 13546,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650220439.975, "dur": 23.667, "args": { "External id": 13547,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7042 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650220522.430, "dur": 341.893, "args": { "External id": 13548,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7043 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650220553.885, "dur": 305.520, "args": { "External id": 13549,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7044, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650220564.763, "dur": 287.678, "args": { "External id": 13550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7045 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650220884.923, "dur": 1.938, "args": { "External id": 13551,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7046, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336759, "tid": 1336759, "ts": 1295650220972.189, "dur": 17377.362, "args": { "External id": 13552,"Record function id": 0, "Ev Idx": 7047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221114.557, "dur": 7.047, "args": { "External id": 13553,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221125.076, "dur": 1.199, "args": { "External id": 13554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221127.905, "dur": 1.938, "args": { "External id": 13555,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221131.409, "dur": 0.715, "args": { "External id": 13556,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221133.474, "dur": 0.890, "args": { "External id": 13557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221137.148, "dur": 0.765, "args": { "External id": 13558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221139.330, "dur": 0.590, "args": { "External id": 13559,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221141.295, "dur": 1.551, "args": { "External id": 13560,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221144.009, "dur": 0.813, "args": { "External id": 13561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650221148.149, "dur": 0.853, "args": { "External id": 13562,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7057 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650221166.823, "dur": 17143.754, "args": { "External id": 13563,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650221182.397, "dur": 17121.773, "args": { "External id": 13564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650221204.959, "dur": 13.415, "args": { "External id": 13565,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650221221.430, "dur": 17050.817, "args": { "External id": 13566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650221224.032, "dur": 17047.676, "args": { "External id": 13567,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650221246.696, "dur": 6.506, "args": { "External id": 13568,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650221255.405, "dur": 17013.411, "args": { "External id": 13569,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7064 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650238481.086, "dur": 34.145, "args": { "External id": 13570,"Sequence number": 246567, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7065 } }, { "ph": "s", "id": 201, "pid": 1336759, "tid": 1336759, "ts": 1295650238481.086, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650238502.930, "dur": 7.448, "args": { "External id": 13571,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650238506.118, "dur": 4.018, "args": { "External id": 13572,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7067 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650238580.770, "dur": 76.491, "args": { "External id": 13573,"Record function id": 0, "Ev Idx": 7068 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650238658.777, "dur": 1037.698, "args": { "External id": 13574,"Record function id": 0, "Ev Idx": 7069 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650238696.225, "dur": 986.860, "args": { "External id": 13575,"Sequence number": 246568, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7070 } }, { "ph": "s", "id": 200, "pid": 1336759, "tid": 1336759, "ts": 1295650238696.225, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650238758.367, "dur": 39.360, "args": { "External id": 13576,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650238809.524, "dur": 103.831, "args": { "External id": 13577,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650238922.655, "dur": 38.036, "args": { "External id": 13578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650238969.059, "dur": 69.931, "args": { "External id": 13579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7074 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650239067.436, "dur": 26.525, "args": { "External id": 13580,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7075 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650239110.527, "dur": 13.290, "args": { "External id": 13581,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7076 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650239141.808, "dur": 139.000, "args": { "External id": 13582,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650239188.030, "dur": 10.914, "args": { "External id": 13583,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650239192.739, "dur": 5.402, "args": { "External id": 13584,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650239201.615, "dur": 5.573, "args": { "External id": 13585,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650239208.460, "dur": 1.300, "args": { "External id": 13586,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650239211.902, "dur": 3.926, "args": { "External id": 13587,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650239292.765, "dur": 49.868, "args": { "External id": 13588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7083 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650239373.606, "dur": 26.631, "args": { "External id": 13589,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650239409.103, "dur": 40.668, "args": { "External id": 13590,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650239457.555, "dur": 34.114, "args": { "External id": 13591,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650239513.762, "dur": 25.305, "args": { "External id": 13592,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650239544.983, "dur": 33.460, "args": { "External id": 13593,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650239596.792, "dur": 18.306, "args": { "External id": 13594,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.13)", "pid": 1336759, "tid": 1336759, "ts": 1295650239758.326, "dur": 73.649, "args": { "External id": 13595,"Record function id": 0, "Ev Idx": 7090 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650239907.135, "dur": 46.210, "args": { "External id": 13596,"Record function id": 0, "Ev Idx": 7091 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.14)", "pid": 1336759, "tid": 1336759, "ts": 1295650239962.833, "dur": 18371.335, "args": { "External id": 13597,"Record function id": 0, "Ev Idx": 7092 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336759, "tid": 1336759, "ts": 1295650239971.028, "dur": 940.794, "args": { "External id": 13598,"Record function id": 0, "Ev Idx": 7093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650240092.012, "dur": 9.004, "args": { "External id": 13599,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650240114.857, "dur": 40.142, "args": { "External id": 13600,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240124.979, "dur": 2.410, "args": { "External id": 13601,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240131.023, "dur": 0.325, "args": { "External id": 13602,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240132.437, "dur": 0.428, "args": { "External id": 13603,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240133.677, "dur": 2.373, "args": { "External id": 13604,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240137.225, "dur": 0.270, "args": { "External id": 13605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240140.466, "dur": 0.339, "args": { "External id": 13606,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240144.151, "dur": 1.437, "args": { "External id": 13607,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240146.533, "dur": 0.239, "args": { "External id": 13608,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240147.785, "dur": 1.579, "args": { "External id": 13609,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650240165.800, "dur": 45.487, "args": { "External id": 13610,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7105 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650240259.460, "dur": 106.820, "args": { "External id": 13611,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650240270.363, "dur": 5.364, "args": { "External id": 13612,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650240281.002, "dur": 10.738, "args": { "External id": 13613,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650240285.368, "dur": 5.947, "args": { "External id": 13614,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240288.982, "dur": 0.713, "args": { "External id": 13615,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650240298.399, "dur": 24.132, "args": { "External id": 13616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240300.280, "dur": 0.328, "args": { "External id": 13617,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240301.819, "dur": 0.501, "args": { "External id": 13618,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240303.603, "dur": 1.857, "args": { "External id": 13619,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240306.232, "dur": 1.695, "args": { "External id": 13620,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240309.378, "dur": 0.309, "args": { "External id": 13621,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240312.623, "dur": 0.196, "args": { "External id": 13622,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240314.201, "dur": 0.176, "args": { "External id": 13623,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240315.326, "dur": 0.282, "args": { "External id": 13624,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650240318.703, "dur": 0.261, "args": { "External id": 13625,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650240332.097, "dur": 26.399, "args": { "External id": 13626,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7121 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650240418.777, "dur": 394.151, "args": { "External id": 13627,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7122 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650240448.694, "dur": 359.014, "args": { "External id": 13628,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7123, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650240459.304, "dur": 342.640, "args": { "External id": 13629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7124 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650240838.922, "dur": 2.313, "args": { "External id": 13630,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7125, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336759, "tid": 1336759, "ts": 1295650240931.995, "dur": 17201.307, "args": { "External id": 13631,"Record function id": 0, "Ev Idx": 7126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241065.962, "dur": 7.081, "args": { "External id": 13632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241076.571, "dur": 0.903, "args": { "External id": 13633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241079.062, "dur": 2.077, "args": { "External id": 13634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241082.892, "dur": 0.787, "args": { "External id": 13635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241085.006, "dur": 0.872, "args": { "External id": 13636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241087.211, "dur": 1.019, "args": { "External id": 13637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241091.066, "dur": 0.834, "args": { "External id": 13638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241093.069, "dur": 1.625, "args": { "External id": 13639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241096.113, "dur": 0.619, "args": { "External id": 13640,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650241098.099, "dur": 0.613, "args": { "External id": 13641,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7136 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650241118.633, "dur": 16976.608, "args": { "External id": 13642,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650241134.248, "dur": 16954.127, "args": { "External id": 13643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650241155.856, "dur": 13.461, "args": { "External id": 13644,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650241172.318, "dur": 16884.679, "args": { "External id": 13645,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650241174.806, "dur": 16881.701, "args": { "External id": 13646,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650241180.272, "dur": 5.359, "args": { "External id": 13647,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650241187.058, "dur": 16866.518, "args": { "External id": 13648,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7143 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650258275.048, "dur": 35.734, "args": { "External id": 13649,"Sequence number": 246569, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7144 } }, { "ph": "s", "id": 199, "pid": 1336759, "tid": 1336759, "ts": 1295650258275.048, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650258298.067, "dur": 7.548, "args": { "External id": 13650,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650258300.803, "dur": 4.424, "args": { "External id": 13651,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7146 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650258370.360, "dur": 77.430, "args": { "External id": 13652,"Record function id": 0, "Ev Idx": 7147 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650258449.058, "dur": 1058.267, "args": { "External id": 13653,"Record function id": 0, "Ev Idx": 7148 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650258486.506, "dur": 1007.908, "args": { "External id": 13654,"Sequence number": 246570, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7149 } }, { "ph": "s", "id": 198, "pid": 1336759, "tid": 1336759, "ts": 1295650258486.506, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650258553.607, "dur": 42.170, "args": { "External id": 13655,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650258607.378, "dur": 108.095, "args": { "External id": 13656,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650258725.135, "dur": 37.718, "args": { "External id": 13657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650258770.980, "dur": 30.468, "args": { "External id": 13658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7153 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650258825.977, "dur": 24.214, "args": { "External id": 13659,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7154 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650258868.017, "dur": 14.183, "args": { "External id": 13660,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7155 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650258898.892, "dur": 166.039, "args": { "External id": 13661,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650258947.687, "dur": 10.641, "args": { "External id": 13662,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650258952.195, "dur": 5.356, "args": { "External id": 13663,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650258961.173, "dur": 5.645, "args": { "External id": 13664,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650258967.886, "dur": 1.837, "args": { "External id": 13665,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650258971.904, "dur": 3.599, "args": { "External id": 13666,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650259077.691, "dur": 51.842, "args": { "External id": 13667,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7162 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650259162.429, "dur": 27.299, "args": { "External id": 13668,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650259198.696, "dur": 57.209, "args": { "External id": 13669,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650259267.427, "dur": 37.702, "args": { "External id": 13670,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7165 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650259326.571, "dur": 24.881, "args": { "External id": 13671,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650259357.210, "dur": 33.630, "args": { "External id": 13672,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650259412.457, "dur": 16.467, "args": { "External id": 13673,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7168 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.14)", "pid": 1336759, "tid": 1336759, "ts": 1295650259570.370, "dur": 73.760, "args": { "External id": 13674,"Record function id": 0, "Ev Idx": 7169 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650259718.174, "dur": 46.238, "args": { "External id": 13675,"Record function id": 0, "Ev Idx": 7170 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.15)", "pid": 1336759, "tid": 1336759, "ts": 1295650259772.674, "dur": 18302.355, "args": { "External id": 13676,"Record function id": 0, "Ev Idx": 7171 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336759, "tid": 1336759, "ts": 1295650259780.700, "dur": 912.509, "args": { "External id": 13677,"Record function id": 0, "Ev Idx": 7172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650259856.574, "dur": 8.009, "args": { "External id": 13678,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650259877.858, "dur": 33.720, "args": { "External id": 13679,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259882.886, "dur": 2.455, "args": { "External id": 13680,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259889.580, "dur": 0.279, "args": { "External id": 13681,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259891.385, "dur": 0.313, "args": { "External id": 13682,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259893.272, "dur": 0.324, "args": { "External id": 13683,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259896.865, "dur": 0.285, "args": { "External id": 13684,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259898.681, "dur": 0.235, "args": { "External id": 13685,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259900.067, "dur": 2.521, "args": { "External id": 13686,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259904.338, "dur": 0.173, "args": { "External id": 13687,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650259905.563, "dur": 0.272, "args": { "External id": 13688,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650259921.308, "dur": 38.677, "args": { "External id": 13689,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7184 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650260034.679, "dur": 121.946, "args": { "External id": 13690,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650260046.306, "dur": 5.690, "args": { "External id": 13691,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650260057.342, "dur": 11.484, "args": { "External id": 13692,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650260062.403, "dur": 5.979, "args": { "External id": 13693,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260065.916, "dur": 0.840, "args": { "External id": 13694,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650260075.563, "dur": 27.239, "args": { "External id": 13695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260077.344, "dur": 2.560, "args": { "External id": 13696,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260081.411, "dur": 0.581, "args": { "External id": 13697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260083.103, "dur": 0.468, "args": { "External id": 13698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260086.888, "dur": 1.336, "args": { "External id": 13699,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260089.134, "dur": 0.491, "args": { "External id": 13700,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260090.916, "dur": 0.220, "args": { "External id": 13701,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260094.087, "dur": 0.296, "args": { "External id": 13702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260095.958, "dur": 0.143, "args": { "External id": 13703,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260096.856, "dur": 2.271, "args": { "External id": 13704,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650260122.412, "dur": 26.299, "args": { "External id": 13705,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7200 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650260210.381, "dur": 387.101, "args": { "External id": 13706,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7201 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650260257.376, "dur": 334.681, "args": { "External id": 13707,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7202, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650260269.868, "dur": 316.438, "args": { "External id": 13708,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7203 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650260621.112, "dur": 2.552, "args": { "External id": 13709,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7204, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336759, "tid": 1336759, "ts": 1295650260713.623, "dur": 17140.632, "args": { "External id": 13710,"Record function id": 0, "Ev Idx": 7205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260807.127, "dur": 6.524, "args": { "External id": 13711,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260817.075, "dur": 0.944, "args": { "External id": 13712,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260819.596, "dur": 2.046, "args": { "External id": 13713,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260823.319, "dur": 0.745, "args": { "External id": 13714,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260825.520, "dur": 0.704, "args": { "External id": 13715,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260827.452, "dur": 0.932, "args": { "External id": 13716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260831.759, "dur": 1.147, "args": { "External id": 13717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260834.204, "dur": 1.902, "args": { "External id": 13718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260837.834, "dur": 0.595, "args": { "External id": 13719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650260839.706, "dur": 0.571, "args": { "External id": 13720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7215 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650260859.586, "dur": 16954.347, "args": { "External id": 13721,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650260874.663, "dur": 16932.383, "args": { "External id": 13722,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650260895.628, "dur": 12.829, "args": { "External id": 13723,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650260911.008, "dur": 16865.414, "args": { "External id": 13724,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650260913.717, "dur": 16861.999, "args": { "External id": 13725,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650260919.197, "dur": 5.104, "args": { "External id": 13726,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650260925.958, "dur": 16846.697, "args": { "External id": 13727,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7222 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650278010.424, "dur": 37.872, "args": { "External id": 13728,"Sequence number": 246571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7223 } }, { "ph": "s", "id": 197, "pid": 1336759, "tid": 1336759, "ts": 1295650278010.424, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650278035.082, "dur": 7.944, "args": { "External id": 13729,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650278038.120, "dur": 4.513, "args": { "External id": 13730,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7225 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650278113.039, "dur": 75.754, "args": { "External id": 13731,"Record function id": 0, "Ev Idx": 7226 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650278190.391, "dur": 1036.242, "args": { "External id": 13732,"Record function id": 0, "Ev Idx": 7227 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650278244.317, "dur": 969.238, "args": { "External id": 13733,"Sequence number": 246572, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7228 } }, { "ph": "s", "id": 196, "pid": 1336759, "tid": 1336759, "ts": 1295650278244.317, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650278313.136, "dur": 43.213, "args": { "External id": 13734,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278368.759, "dur": 103.611, "args": { "External id": 13735,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278481.836, "dur": 38.159, "args": { "External id": 13736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278528.503, "dur": 29.961, "args": { "External id": 13737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7232 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650278582.807, "dur": 23.160, "args": { "External id": 13738,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7233 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650278622.560, "dur": 13.423, "args": { "External id": 13739,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7234 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650278653.753, "dur": 123.045, "args": { "External id": 13740,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650278701.515, "dur": 11.193, "args": { "External id": 13741,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650278706.329, "dur": 5.511, "args": { "External id": 13742,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650278715.595, "dur": 5.355, "args": { "External id": 13743,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650278722.339, "dur": 1.283, "args": { "External id": 13744,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650278726.337, "dur": 3.753, "args": { "External id": 13745,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278786.932, "dur": 42.879, "args": { "External id": 13746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7241 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650278858.378, "dur": 25.756, "args": { "External id": 13747,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278892.940, "dur": 39.410, "args": { "External id": 13748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650278940.525, "dur": 34.044, "args": { "External id": 13749,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7244 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650279034.522, "dur": 27.422, "args": { "External id": 13750,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650279068.754, "dur": 38.095, "args": { "External id": 13751,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7246 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650279126.498, "dur": 17.988, "args": { "External id": 13752,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7247 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.15)", "pid": 1336759, "tid": 1336759, "ts": 1295650279306.945, "dur": 72.362, "args": { "External id": 13753,"Record function id": 0, "Ev Idx": 7248 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650279450.705, "dur": 45.959, "args": { "External id": 13754,"Record function id": 0, "Ev Idx": 7249 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.16)", "pid": 1336759, "tid": 1336759, "ts": 1295650279506.031, "dur": 18374.351, "args": { "External id": 13755,"Record function id": 0, "Ev Idx": 7250 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336759, "tid": 1336759, "ts": 1295650279514.282, "dur": 870.319, "args": { "External id": 13756,"Record function id": 0, "Ev Idx": 7251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650279591.814, "dur": 8.221, "args": { "External id": 13757,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650279612.681, "dur": 34.367, "args": { "External id": 13758,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279617.591, "dur": 2.273, "args": { "External id": 13759,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279624.503, "dur": 0.343, "args": { "External id": 13760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279626.234, "dur": 0.369, "args": { "External id": 13761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279628.061, "dur": 0.658, "args": { "External id": 13762,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279631.359, "dur": 0.434, "args": { "External id": 13763,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279633.205, "dur": 0.330, "args": { "External id": 13764,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279634.847, "dur": 3.135, "args": { "External id": 13765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279639.372, "dur": 0.456, "args": { "External id": 13766,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279641.043, "dur": 0.248, "args": { "External id": 13767,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650279660.195, "dur": 41.582, "args": { "External id": 13768,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7263 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650279733.502, "dur": 100.137, "args": { "External id": 13769,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650279743.963, "dur": 5.367, "args": { "External id": 13770,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650279754.133, "dur": 10.008, "args": { "External id": 13771,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650279758.578, "dur": 5.108, "args": { "External id": 13772,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279761.909, "dur": 0.452, "args": { "External id": 13773,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650279770.351, "dur": 25.103, "args": { "External id": 13774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279772.182, "dur": 0.523, "args": { "External id": 13775,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279774.148, "dur": 2.409, "args": { "External id": 13776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279777.645, "dur": 0.482, "args": { "External id": 13777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279779.295, "dur": 1.301, "args": { "External id": 13778,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279783.448, "dur": 0.171, "args": { "External id": 13779,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279784.816, "dur": 0.372, "args": { "External id": 13780,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279786.309, "dur": 0.392, "args": { "External id": 13781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279789.896, "dur": 0.369, "args": { "External id": 13782,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650279791.167, "dur": 0.272, "args": { "External id": 13783,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650279804.576, "dur": 21.730, "args": { "External id": 13784,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7279 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650279883.591, "dur": 400.408, "args": { "External id": 13785,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7280 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650279913.728, "dur": 364.439, "args": { "External id": 13786,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7281, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650279923.569, "dur": 348.694, "args": { "External id": 13787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7282 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650280310.759, "dur": 2.595, "args": { "External id": 13788,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7283, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336759, "tid": 1336759, "ts": 1295650280405.346, "dur": 17287.503, "args": { "External id": 13789,"Record function id": 0, "Ev Idx": 7284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280500.794, "dur": 6.457, "args": { "External id": 13790,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280510.702, "dur": 1.095, "args": { "External id": 13791,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280513.470, "dur": 2.011, "args": { "External id": 13792,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280517.084, "dur": 0.833, "args": { "External id": 13793,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280519.320, "dur": 0.797, "args": { "External id": 13794,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280521.436, "dur": 0.821, "args": { "External id": 13795,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280525.068, "dur": 0.829, "args": { "External id": 13796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280527.947, "dur": 1.438, "args": { "External id": 13797,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280530.692, "dur": 0.607, "args": { "External id": 13798,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650280532.618, "dur": 0.441, "args": { "External id": 13799,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650280552.947, "dur": 17101.604, "args": { "External id": 13800,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650280567.628, "dur": 17080.101, "args": { "External id": 13801,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650280589.194, "dur": 12.874, "args": { "External id": 13802,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650280604.979, "dur": 17010.716, "args": { "External id": 13803,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650280607.400, "dur": 17007.767, "args": { "External id": 13804,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650280612.824, "dur": 4.792, "args": { "External id": 13805,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650280619.165, "dur": 16992.933, "args": { "External id": 13806,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7301 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650297823.072, "dur": 33.397, "args": { "External id": 13807,"Sequence number": 246573, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7302 } }, { "ph": "s", "id": 195, "pid": 1336759, "tid": 1336759, "ts": 1295650297823.072, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650297844.529, "dur": 7.223, "args": { "External id": 13808,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650297847.542, "dur": 4.022, "args": { "External id": 13809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7304 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650297918.253, "dur": 104.236, "args": { "External id": 13810,"Record function id": 0, "Ev Idx": 7305 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650298025.557, "dur": 1084.225, "args": { "External id": 13811,"Record function id": 0, "Ev Idx": 7306 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650298068.208, "dur": 1028.153, "args": { "External id": 13812,"Sequence number": 246574, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7307 } }, { "ph": "s", "id": 194, "pid": 1336759, "tid": 1336759, "ts": 1295650298068.208, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650298134.783, "dur": 41.051, "args": { "External id": 13813,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298188.041, "dur": 120.610, "args": { "External id": 13814,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298321.894, "dur": 38.271, "args": { "External id": 13815,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298368.142, "dur": 30.803, "args": { "External id": 13816,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7311 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650298429.714, "dur": 26.105, "args": { "External id": 13817,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7312 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650298471.285, "dur": 14.966, "args": { "External id": 13818,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7313 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650298504.546, "dur": 128.902, "args": { "External id": 13819,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650298555.150, "dur": 11.514, "args": { "External id": 13820,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650298559.905, "dur": 5.902, "args": { "External id": 13821,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650298569.431, "dur": 5.422, "args": { "External id": 13822,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650298576.686, "dur": 1.148, "args": { "External id": 13823,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650298580.106, "dur": 5.579, "args": { "External id": 13824,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298670.321, "dur": 44.984, "args": { "External id": 13825,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7320 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650298748.572, "dur": 27.976, "args": { "External id": 13826,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298785.142, "dur": 40.703, "args": { "External id": 13827,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298834.153, "dur": 34.516, "args": { "External id": 13828,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7323 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650298889.080, "dur": 25.204, "args": { "External id": 13829,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650298919.662, "dur": 32.995, "args": { "External id": 13830,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650298972.557, "dur": 54.702, "args": { "External id": 13831,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7326 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.16)", "pid": 1336759, "tid": 1336759, "ts": 1295650299174.648, "dur": 89.130, "args": { "External id": 13832,"Record function id": 0, "Ev Idx": 7327 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650299339.784, "dur": 48.621, "args": { "External id": 13833,"Record function id": 0, "Ev Idx": 7328 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.17)", "pid": 1336759, "tid": 1336759, "ts": 1295650299396.732, "dur": 18254.228, "args": { "External id": 13834,"Record function id": 0, "Ev Idx": 7329 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336759, "tid": 1336759, "ts": 1295650299404.940, "dur": 925.122, "args": { "External id": 13835,"Record function id": 0, "Ev Idx": 7330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650299481.836, "dur": 9.433, "args": { "External id": 13836,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650299504.201, "dur": 32.707, "args": { "External id": 13837,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299509.804, "dur": 2.349, "args": { "External id": 13838,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299516.415, "dur": 0.591, "args": { "External id": 13839,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299518.497, "dur": 0.515, "args": { "External id": 13840,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299520.011, "dur": 0.390, "args": { "External id": 13841,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299522.911, "dur": 0.430, "args": { "External id": 13842,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299524.084, "dur": 0.202, "args": { "External id": 13843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299525.418, "dur": 3.128, "args": { "External id": 13844,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299529.950, "dur": 0.287, "args": { "External id": 13845,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299531.349, "dur": 0.288, "args": { "External id": 13846,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650299547.001, "dur": 43.265, "args": { "External id": 13847,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7342 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650299621.716, "dur": 102.385, "args": { "External id": 13848,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650299631.849, "dur": 4.329, "args": { "External id": 13849,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650299640.728, "dur": 9.986, "args": { "External id": 13850,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650299645.299, "dur": 5.008, "args": { "External id": 13851,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299648.578, "dur": 0.618, "args": { "External id": 13852,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650299657.196, "dur": 25.085, "args": { "External id": 13853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299658.987, "dur": 2.010, "args": { "External id": 13854,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299661.944, "dur": 0.446, "args": { "External id": 13855,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299663.616, "dur": 0.334, "args": { "External id": 13856,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299666.956, "dur": 1.463, "args": { "External id": 13857,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299669.602, "dur": 0.503, "args": { "External id": 13858,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299671.117, "dur": 0.158, "args": { "External id": 13859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299673.984, "dur": 0.207, "args": { "External id": 13860,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299675.239, "dur": 0.185, "args": { "External id": 13861,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650299676.454, "dur": 1.962, "args": { "External id": 13862,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650299693.077, "dur": 23.934, "args": { "External id": 13863,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7358 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650299773.966, "dur": 441.172, "args": { "External id": 13864,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7359 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650299802.817, "dur": 407.001, "args": { "External id": 13865,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7360, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650299812.829, "dur": 391.029, "args": { "External id": 13866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7361 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650300255.191, "dur": 3.015, "args": { "External id": 13867,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7362, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336759, "tid": 1336759, "ts": 1295650300349.976, "dur": 17113.636, "args": { "External id": 13868,"Record function id": 0, "Ev Idx": 7363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300444.737, "dur": 6.636, "args": { "External id": 13869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300454.641, "dur": 0.913, "args": { "External id": 13870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300457.119, "dur": 2.092, "args": { "External id": 13871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300461.192, "dur": 0.916, "args": { "External id": 13872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300463.751, "dur": 0.664, "args": { "External id": 13873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300466.132, "dur": 0.896, "args": { "External id": 13874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300470.685, "dur": 0.647, "args": { "External id": 13875,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300473.093, "dur": 1.432, "args": { "External id": 13876,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300475.904, "dur": 0.604, "args": { "External id": 13877,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650300477.974, "dur": 0.716, "args": { "External id": 13878,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7373 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650300497.939, "dur": 16926.003, "args": { "External id": 13879,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650300513.236, "dur": 16903.478, "args": { "External id": 13880,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650300535.221, "dur": 14.224, "args": { "External id": 13881,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650300552.334, "dur": 16831.659, "args": { "External id": 13882,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650300555.223, "dur": 16828.238, "args": { "External id": 13883,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650300560.814, "dur": 5.058, "args": { "External id": 13884,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650300567.873, "dur": 16812.125, "args": { "External id": 13885,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7380 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650317591.525, "dur": 34.401, "args": { "External id": 13886,"Sequence number": 246575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7381 } }, { "ph": "s", "id": 193, "pid": 1336759, "tid": 1336759, "ts": 1295650317591.525, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650317613.215, "dur": 7.822, "args": { "External id": 13887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650317616.362, "dur": 4.477, "args": { "External id": 13888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7383 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650317689.739, "dur": 77.382, "args": { "External id": 13889,"Record function id": 0, "Ev Idx": 7384 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650317768.777, "dur": 1052.496, "args": { "External id": 13890,"Record function id": 0, "Ev Idx": 7385 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650317807.470, "dur": 1000.786, "args": { "External id": 13891,"Sequence number": 246576, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7386 } }, { "ph": "s", "id": 192, "pid": 1336759, "tid": 1336759, "ts": 1295650317807.470, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650317875.745, "dur": 40.527, "args": { "External id": 13892,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650317928.548, "dur": 132.734, "args": { "External id": 13893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318075.033, "dur": 41.984, "args": { "External id": 13894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318125.503, "dur": 30.850, "args": { "External id": 13895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7390 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650318182.699, "dur": 25.135, "args": { "External id": 13896,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7391 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650318224.489, "dur": 30.961, "args": { "External id": 13897,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7392 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650318276.412, "dur": 127.053, "args": { "External id": 13898,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650318325.156, "dur": 12.158, "args": { "External id": 13899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650318330.053, "dur": 6.219, "args": { "External id": 13900,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650318340.112, "dur": 5.344, "args": { "External id": 13901,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650318346.968, "dur": 1.258, "args": { "External id": 13902,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650318350.714, "dur": 3.993, "args": { "External id": 13903,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318413.485, "dur": 51.389, "args": { "External id": 13904,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7399 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650318497.266, "dur": 28.307, "args": { "External id": 13905,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318534.286, "dur": 40.918, "args": { "External id": 13906,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318583.488, "dur": 33.777, "args": { "External id": 13907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650318641.100, "dur": 24.286, "args": { "External id": 13908,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650318670.621, "dur": 33.584, "args": { "External id": 13909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650318723.734, "dur": 16.257, "args": { "External id": 13910,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7405 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.17)", "pid": 1336759, "tid": 1336759, "ts": 1295650318884.632, "dur": 70.149, "args": { "External id": 13911,"Record function id": 0, "Ev Idx": 7406 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650319074.895, "dur": 48.913, "args": { "External id": 13912,"Record function id": 0, "Ev Idx": 7407 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.18)", "pid": 1336759, "tid": 1336759, "ts": 1295650319133.042, "dur": 18386.621, "args": { "External id": 13913,"Record function id": 0, "Ev Idx": 7408 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336759, "tid": 1336759, "ts": 1295650319140.823, "dur": 825.080, "args": { "External id": 13914,"Record function id": 0, "Ev Idx": 7409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650319219.234, "dur": 24.819, "args": { "External id": 13915,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650319260.579, "dur": 33.049, "args": { "External id": 13916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319266.137, "dur": 2.495, "args": { "External id": 13917,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319272.295, "dur": 0.235, "args": { "External id": 13918,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319273.835, "dur": 0.239, "args": { "External id": 13919,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319275.344, "dur": 0.232, "args": { "External id": 13920,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319278.623, "dur": 0.610, "args": { "External id": 13921,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319280.555, "dur": 0.557, "args": { "External id": 13922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319281.991, "dur": 2.839, "args": { "External id": 13923,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319285.978, "dur": 0.378, "args": { "External id": 13924,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319287.681, "dur": 0.154, "args": { "External id": 13925,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650319304.371, "dur": 43.546, "args": { "External id": 13926,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7421 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650319381.579, "dur": 107.693, "args": { "External id": 13927,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650319395.428, "dur": 6.569, "args": { "External id": 13928,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650319407.036, "dur": 10.050, "args": { "External id": 13929,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650319411.639, "dur": 5.036, "args": { "External id": 13930,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319414.853, "dur": 0.347, "args": { "External id": 13931,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650319423.373, "dur": 24.497, "args": { "External id": 13932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319425.487, "dur": 0.481, "args": { "External id": 13933,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319427.337, "dur": 2.277, "args": { "External id": 13934,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319430.754, "dur": 0.220, "args": { "External id": 13935,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319431.708, "dur": 2.234, "args": { "External id": 13936,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319437.067, "dur": 0.249, "args": { "External id": 13937,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319438.208, "dur": 0.370, "args": { "External id": 13938,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319439.733, "dur": 0.301, "args": { "External id": 13939,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319442.747, "dur": 0.562, "args": { "External id": 13940,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650319444.323, "dur": 0.164, "args": { "External id": 13941,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650319457.739, "dur": 24.185, "args": { "External id": 13942,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7437 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650319542.863, "dur": 336.575, "args": { "External id": 13943,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7438 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650319574.423, "dur": 300.427, "args": { "External id": 13944,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7439, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650319584.440, "dur": 284.856, "args": { "External id": 13945,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650319901.275, "dur": 2.111, "args": { "External id": 13946,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7441, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336759, "tid": 1336759, "ts": 1295650320027.147, "dur": 17304.134, "args": { "External id": 13947,"Record function id": 0, "Ev Idx": 7442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320127.217, "dur": 6.793, "args": { "External id": 13948,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320137.619, "dur": 1.035, "args": { "External id": 13949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320140.412, "dur": 1.900, "args": { "External id": 13950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320144.239, "dur": 0.930, "args": { "External id": 13951,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320146.485, "dur": 0.832, "args": { "External id": 13952,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320148.663, "dur": 0.537, "args": { "External id": 13953,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320152.589, "dur": 0.841, "args": { "External id": 13954,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320154.945, "dur": 1.376, "args": { "External id": 13955,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320157.986, "dur": 0.680, "args": { "External id": 13956,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650320160.033, "dur": 0.670, "args": { "External id": 13957,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7452 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650320180.115, "dur": 17111.326, "args": { "External id": 13958,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650320194.831, "dur": 17089.941, "args": { "External id": 13959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650320216.047, "dur": 29.081, "args": { "External id": 13960,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650320248.888, "dur": 17005.159, "args": { "External id": 13961,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650320251.818, "dur": 17001.735, "args": { "External id": 13962,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650320257.103, "dur": 5.803, "args": { "External id": 13963,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650320264.347, "dur": 16986.366, "args": { "External id": 13964,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7459 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650337461.885, "dur": 33.180, "args": { "External id": 13965,"Sequence number": 246577, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7460 } }, { "ph": "s", "id": 191, "pid": 1336759, "tid": 1336759, "ts": 1295650337461.885, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650337482.725, "dur": 7.572, "args": { "External id": 13966,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650337485.913, "dur": 4.207, "args": { "External id": 13967,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7462 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650337558.651, "dur": 76.681, "args": { "External id": 13968,"Record function id": 0, "Ev Idx": 7463 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650337637.068, "dur": 1049.004, "args": { "External id": 13969,"Record function id": 0, "Ev Idx": 7464 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650337675.588, "dur": 997.072, "args": { "External id": 13970,"Sequence number": 246578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7465 } }, { "ph": "s", "id": 190, "pid": 1336759, "tid": 1336759, "ts": 1295650337675.588, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650337744.699, "dur": 40.981, "args": { "External id": 13971,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650337799.372, "dur": 102.811, "args": { "External id": 13972,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650337911.403, "dur": 37.696, "args": { "External id": 13973,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650337955.305, "dur": 68.685, "args": { "External id": 13974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7469 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650338054.737, "dur": 25.920, "args": { "External id": 13975,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7470 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650338095.766, "dur": 15.742, "args": { "External id": 13976,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7471 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650338128.454, "dur": 146.248, "args": { "External id": 13977,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650338180.070, "dur": 11.404, "args": { "External id": 13978,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650338185.243, "dur": 5.331, "args": { "External id": 13979,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650338194.141, "dur": 5.306, "args": { "External id": 13980,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650338200.627, "dur": 3.276, "args": { "External id": 13981,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650338206.397, "dur": 3.502, "args": { "External id": 13982,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650338286.250, "dur": 52.775, "args": { "External id": 13983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7478 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650338369.313, "dur": 25.611, "args": { "External id": 13984,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650338403.188, "dur": 40.688, "args": { "External id": 13985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650338450.592, "dur": 33.781, "args": { "External id": 13986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7481 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650338508.636, "dur": 27.073, "args": { "External id": 13987,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650338541.091, "dur": 33.018, "args": { "External id": 13988,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7483 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650338591.436, "dur": 18.664, "args": { "External id": 13989,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7484 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.18)", "pid": 1336759, "tid": 1336759, "ts": 1295650338747.023, "dur": 69.742, "args": { "External id": 13990,"Record function id": 0, "Ev Idx": 7485 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650338887.652, "dur": 48.648, "args": { "External id": 13991,"Record function id": 0, "Ev Idx": 7486 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.19)", "pid": 1336759, "tid": 1336759, "ts": 1295650338945.911, "dur": 18379.648, "args": { "External id": 13992,"Record function id": 0, "Ev Idx": 7487 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336759, "tid": 1336759, "ts": 1295650338955.279, "dur": 926.307, "args": { "External id": 13993,"Record function id": 0, "Ev Idx": 7488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650339073.704, "dur": 9.470, "args": { "External id": 13994,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650339097.081, "dur": 32.960, "args": { "External id": 13995,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339102.572, "dur": 2.256, "args": { "External id": 13996,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339109.073, "dur": 0.240, "args": { "External id": 13997,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339110.389, "dur": 0.374, "args": { "External id": 13998,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339112.372, "dur": 0.484, "args": { "External id": 13999,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339115.300, "dur": 0.621, "args": { "External id": 14000,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339116.988, "dur": 0.510, "args": { "External id": 14001,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339118.645, "dur": 2.959, "args": { "External id": 14002,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339122.991, "dur": 0.160, "args": { "External id": 14003,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339124.111, "dur": 0.353, "args": { "External id": 14004,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650339140.793, "dur": 47.896, "args": { "External id": 14005,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7500 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650339222.195, "dur": 125.935, "args": { "External id": 14006,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650339250.581, "dur": 5.001, "args": { "External id": 14007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650339260.960, "dur": 10.922, "args": { "External id": 14008,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650339265.527, "dur": 5.959, "args": { "External id": 14009,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339268.957, "dur": 0.762, "args": { "External id": 14010,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650339279.001, "dur": 24.291, "args": { "External id": 14011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339281.013, "dur": 2.204, "args": { "External id": 14012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339284.558, "dur": 0.262, "args": { "External id": 14013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339286.109, "dur": 0.356, "args": { "External id": 14014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339289.518, "dur": 1.426, "args": { "External id": 14015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339292.151, "dur": 0.131, "args": { "External id": 14016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339293.524, "dur": 0.415, "args": { "External id": 14017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339295.942, "dur": 0.176, "args": { "External id": 14018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339297.232, "dur": 0.166, "args": { "External id": 14019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650339298.259, "dur": 1.787, "args": { "External id": 14020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650339315.006, "dur": 25.122, "args": { "External id": 14021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7516 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650339403.405, "dur": 387.712, "args": { "External id": 14022,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7517 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650339434.612, "dur": 351.491, "args": { "External id": 14023,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7518, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650339444.552, "dur": 335.951, "args": { "External id": 14024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7519 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650339812.125, "dur": 2.110, "args": { "External id": 14025,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7520, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336759, "tid": 1336759, "ts": 1295650339900.887, "dur": 17219.556, "args": { "External id": 14026,"Record function id": 0, "Ev Idx": 7521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340041.147, "dur": 6.630, "args": { "External id": 14027,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340060.253, "dur": 0.898, "args": { "External id": 14028,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340062.956, "dur": 1.873, "args": { "External id": 14029,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340068.414, "dur": 0.784, "args": { "External id": 14030,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340070.638, "dur": 0.603, "args": { "External id": 14031,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340072.325, "dur": 0.497, "args": { "External id": 14032,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340074.286, "dur": 0.601, "args": { "External id": 14033,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340078.160, "dur": 1.796, "args": { "External id": 14034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340081.234, "dur": 0.438, "args": { "External id": 14035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650340083.293, "dur": 0.479, "args": { "External id": 14036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7531 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650340104.232, "dur": 16977.047, "args": { "External id": 14037,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650340120.782, "dur": 16954.038, "args": { "External id": 14038,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650340140.569, "dur": 12.899, "args": { "External id": 14039,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650340158.142, "dur": 16885.366, "args": { "External id": 14040,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650340160.379, "dur": 16882.442, "args": { "External id": 14041,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650340166.491, "dur": 5.084, "args": { "External id": 14042,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650340173.584, "dur": 16866.278, "args": { "External id": 14043,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7538 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650357261.600, "dur": 38.040, "args": { "External id": 14044,"Sequence number": 246579, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7539 } }, { "ph": "s", "id": 189, "pid": 1336759, "tid": 1336759, "ts": 1295650357261.600, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650357286.456, "dur": 7.779, "args": { "External id": 14045,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650357289.595, "dur": 4.302, "args": { "External id": 14046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7541 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650357363.651, "dur": 75.173, "args": { "External id": 14047,"Record function id": 0, "Ev Idx": 7542 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650357440.575, "dur": 1036.423, "args": { "External id": 14048,"Record function id": 0, "Ev Idx": 7543 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650357476.941, "dur": 986.748, "args": { "External id": 14049,"Sequence number": 246580, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7544 } }, { "ph": "s", "id": 188, "pid": 1336759, "tid": 1336759, "ts": 1295650357476.941, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650357541.018, "dur": 42.244, "args": { "External id": 14050,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650357595.764, "dur": 103.747, "args": { "External id": 14051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650357708.333, "dur": 38.117, "args": { "External id": 14052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650357754.846, "dur": 31.101, "args": { "External id": 14053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7548 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650357809.362, "dur": 24.999, "args": { "External id": 14054,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7549 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650357851.300, "dur": 13.448, "args": { "External id": 14055,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7550 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650357880.353, "dur": 161.582, "args": { "External id": 14056,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650357928.446, "dur": 10.685, "args": { "External id": 14057,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650357932.942, "dur": 5.422, "args": { "External id": 14058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650357941.670, "dur": 5.223, "args": { "External id": 14059,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650357948.390, "dur": 1.652, "args": { "External id": 14060,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650357952.303, "dur": 2.434, "args": { "External id": 14061,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650358054.548, "dur": 51.035, "args": { "External id": 14062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7557 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650358137.445, "dur": 26.479, "args": { "External id": 14063,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650358171.409, "dur": 39.985, "args": { "External id": 14064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650358219.594, "dur": 49.540, "args": { "External id": 14065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7560 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650358293.944, "dur": 25.499, "args": { "External id": 14066,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650358326.156, "dur": 34.963, "args": { "External id": 14067,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7562 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650358379.084, "dur": 17.759, "args": { "External id": 14068,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7563 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.19)", "pid": 1336759, "tid": 1336759, "ts": 1295650358538.029, "dur": 72.262, "args": { "External id": 14069,"Record function id": 0, "Ev Idx": 7564 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650358683.402, "dur": 45.225, "args": { "External id": 14070,"Record function id": 0, "Ev Idx": 7565 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.20)", "pid": 1336759, "tid": 1336759, "ts": 1295650358737.299, "dur": 18221.753, "args": { "External id": 14071,"Record function id": 0, "Ev Idx": 7566 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336759, "tid": 1336759, "ts": 1295650358746.927, "dur": 875.871, "args": { "External id": 14072,"Record function id": 0, "Ev Idx": 7567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650358821.830, "dur": 8.025, "args": { "External id": 14073,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650358842.065, "dur": 33.308, "args": { "External id": 14074,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358847.315, "dur": 2.569, "args": { "External id": 14075,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358854.135, "dur": 0.375, "args": { "External id": 14076,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358855.974, "dur": 0.419, "args": { "External id": 14077,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358857.795, "dur": 0.426, "args": { "External id": 14078,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358861.188, "dur": 0.450, "args": { "External id": 14079,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358862.744, "dur": 0.510, "args": { "External id": 14080,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358864.258, "dur": 2.027, "args": { "External id": 14081,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358867.485, "dur": 0.620, "args": { "External id": 14082,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650358869.460, "dur": 0.486, "args": { "External id": 14083,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650358885.790, "dur": 39.853, "args": { "External id": 14084,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650358955.926, "dur": 157.153, "args": { "External id": 14085,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650358966.246, "dur": 4.463, "args": { "External id": 14086,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650358975.582, "dur": 53.004, "args": { "External id": 14087,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650358980.044, "dur": 48.105, "args": { "External id": 14088,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359025.598, "dur": 0.834, "args": { "External id": 14089,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650359037.142, "dur": 29.527, "args": { "External id": 14090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359039.008, "dur": 2.018, "args": { "External id": 14091,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359042.288, "dur": 0.734, "args": { "External id": 14092,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359047.594, "dur": 0.647, "args": { "External id": 14093,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359050.676, "dur": 0.558, "args": { "External id": 14094,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359052.520, "dur": 0.598, "args": { "External id": 14095,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359054.214, "dur": 1.847, "args": { "External id": 14096,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359057.332, "dur": 0.550, "args": { "External id": 14097,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359058.981, "dur": 0.895, "args": { "External id": 14098,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359062.741, "dur": 0.380, "args": { "External id": 14099,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650359076.945, "dur": 27.833, "args": { "External id": 14100,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7595 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650359166.088, "dur": 361.648, "args": { "External id": 14101,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7596 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650359198.530, "dur": 324.299, "args": { "External id": 14102,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7597, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650359208.855, "dur": 308.411, "args": { "External id": 14103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7598 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650359552.071, "dur": 2.368, "args": { "External id": 14104,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7599, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336759, "tid": 1336759, "ts": 1295650359643.288, "dur": 17128.013, "args": { "External id": 14105,"Record function id": 0, "Ev Idx": 7600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359737.793, "dur": 6.875, "args": { "External id": 14106,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359747.911, "dur": 1.244, "args": { "External id": 14107,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359750.902, "dur": 1.276, "args": { "External id": 14108,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359753.813, "dur": 1.218, "args": { "External id": 14109,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359756.484, "dur": 0.920, "args": { "External id": 14110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359758.608, "dur": 0.844, "args": { "External id": 14111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359762.903, "dur": 1.374, "args": { "External id": 14112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359765.744, "dur": 2.064, "args": { "External id": 14113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359769.148, "dur": 1.199, "args": { "External id": 14114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650359771.632, "dur": 0.988, "args": { "External id": 14115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7610 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650359791.179, "dur": 16942.201, "args": { "External id": 14116,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650359806.522, "dur": 16920.433, "args": { "External id": 14117,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650359827.786, "dur": 12.803, "args": { "External id": 14118,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650359843.435, "dur": 16852.839, "args": { "External id": 14119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650359846.244, "dur": 16849.395, "args": { "External id": 14120,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650359851.358, "dur": 5.565, "args": { "External id": 14121,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650359858.701, "dur": 16833.922, "args": { "External id": 14122,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7617 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650376897.899, "dur": 37.867, "args": { "External id": 14123,"Sequence number": 246581, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7618 } }, { "ph": "s", "id": 187, "pid": 1336759, "tid": 1336759, "ts": 1295650376897.899, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650376923.376, "dur": 7.642, "args": { "External id": 14124,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650376926.695, "dur": 4.118, "args": { "External id": 14125,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7620 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650377022.523, "dur": 77.892, "args": { "External id": 14126,"Record function id": 0, "Ev Idx": 7621 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650377102.227, "dur": 1040.348, "args": { "External id": 14127,"Record function id": 0, "Ev Idx": 7622 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650377143.698, "dur": 985.991, "args": { "External id": 14128,"Sequence number": 246582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7623 } }, { "ph": "s", "id": 186, "pid": 1336759, "tid": 1336759, "ts": 1295650377143.698, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650377211.131, "dur": 57.351, "args": { "External id": 14129,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377283.553, "dur": 105.059, "args": { "External id": 14130,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377398.966, "dur": 36.994, "args": { "External id": 14131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377442.243, "dur": 30.095, "args": { "External id": 14132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7627 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650377498.495, "dur": 24.114, "args": { "External id": 14133,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7628 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650377537.435, "dur": 13.947, "args": { "External id": 14134,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7629 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650377567.903, "dur": 126.280, "args": { "External id": 14135,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650377616.404, "dur": 11.724, "args": { "External id": 14136,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650377621.168, "dur": 6.023, "args": { "External id": 14137,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650377630.804, "dur": 5.058, "args": { "External id": 14138,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650377637.153, "dur": 1.755, "args": { "External id": 14139,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650377643.256, "dur": 3.068, "args": { "External id": 14140,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377706.063, "dur": 43.086, "args": { "External id": 14141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7636 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650377779.026, "dur": 25.707, "args": { "External id": 14142,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377812.705, "dur": 39.570, "args": { "External id": 14143,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377859.242, "dur": 34.081, "args": { "External id": 14144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650377915.424, "dur": 26.895, "args": { "External id": 14145,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650377947.916, "dur": 32.906, "args": { "External id": 14146,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650378042.451, "dur": 20.482, "args": { "External id": 14147,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.20)", "pid": 1336759, "tid": 1336759, "ts": 1295650378204.320, "dur": 91.067, "args": { "External id": 14148,"Record function id": 0, "Ev Idx": 7643 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650378372.187, "dur": 48.726, "args": { "External id": 14149,"Record function id": 0, "Ev Idx": 7644 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.21)", "pid": 1336759, "tid": 1336759, "ts": 1295650378429.699, "dur": 18332.955, "args": { "External id": 14150,"Record function id": 0, "Ev Idx": 7645 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336759, "tid": 1336759, "ts": 1295650378438.531, "dur": 900.056, "args": { "External id": 14151,"Record function id": 0, "Ev Idx": 7646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650378515.531, "dur": 8.999, "args": { "External id": 14152,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650378537.433, "dur": 32.798, "args": { "External id": 14153,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378542.760, "dur": 2.259, "args": { "External id": 14154,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378548.983, "dur": 0.574, "args": { "External id": 14155,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378550.658, "dur": 0.576, "args": { "External id": 14156,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378552.357, "dur": 0.590, "args": { "External id": 14157,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378555.517, "dur": 0.555, "args": { "External id": 14158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378557.237, "dur": 0.464, "args": { "External id": 14159,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378558.824, "dur": 2.196, "args": { "External id": 14160,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378562.314, "dur": 0.807, "args": { "External id": 14161,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378563.943, "dur": 0.705, "args": { "External id": 14162,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650378579.960, "dur": 40.602, "args": { "External id": 14163,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7658 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650378652.108, "dur": 106.660, "args": { "External id": 14164,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650378662.202, "dur": 4.085, "args": { "External id": 14165,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650378671.077, "dur": 10.412, "args": { "External id": 14166,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650378675.448, "dur": 5.620, "args": { "External id": 14167,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378679.145, "dur": 0.617, "args": { "External id": 14168,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650378687.878, "dur": 27.478, "args": { "External id": 14169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378689.706, "dur": 2.383, "args": { "External id": 14170,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378693.434, "dur": 0.451, "args": { "External id": 14171,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378695.252, "dur": 0.647, "args": { "External id": 14172,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378699.109, "dur": 0.708, "args": { "External id": 14173,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378700.893, "dur": 0.371, "args": { "External id": 14174,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378702.457, "dur": 0.554, "args": { "External id": 14175,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378705.913, "dur": 0.517, "args": { "External id": 14176,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378707.711, "dur": 0.793, "args": { "External id": 14177,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650378709.564, "dur": 1.983, "args": { "External id": 14178,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650378727.820, "dur": 23.681, "args": { "External id": 14179,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7674 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650378817.284, "dur": 404.030, "args": { "External id": 14180,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7675 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650378846.617, "dur": 369.232, "args": { "External id": 14181,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7676, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650378856.701, "dur": 351.464, "args": { "External id": 14182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7677 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650379261.238, "dur": 3.548, "args": { "External id": 14183,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7678, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336759, "tid": 1336759, "ts": 1295650379358.822, "dur": 17214.145, "args": { "External id": 14184,"Record function id": 0, "Ev Idx": 7679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379455.382, "dur": 6.944, "args": { "External id": 14185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379465.663, "dur": 1.287, "args": { "External id": 14186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379468.746, "dur": 0.966, "args": { "External id": 14187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379471.318, "dur": 1.038, "args": { "External id": 14188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379473.966, "dur": 1.092, "args": { "External id": 14189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379478.545, "dur": 0.859, "args": { "External id": 14190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379481.173, "dur": 1.166, "args": { "External id": 14191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379483.716, "dur": 2.283, "args": { "External id": 14192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379487.544, "dur": 0.842, "args": { "External id": 14193,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650379491.851, "dur": 1.214, "args": { "External id": 14194,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7689 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650379510.825, "dur": 17021.488, "args": { "External id": 14195,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650379525.236, "dur": 17000.357, "args": { "External id": 14196,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650379547.327, "dur": 12.505, "args": { "External id": 14197,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650379562.777, "dur": 16929.334, "args": { "External id": 14198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650379565.229, "dur": 16926.327, "args": { "External id": 14199,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650379571.161, "dur": 5.102, "args": { "External id": 14200,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650379577.919, "dur": 16910.866, "args": { "External id": 14201,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7696 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650396703.367, "dur": 33.069, "args": { "External id": 14202,"Sequence number": 246583, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7697 } }, { "ph": "s", "id": 185, "pid": 1336759, "tid": 1336759, "ts": 1295650396703.367, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650396724.113, "dur": 7.365, "args": { "External id": 14203,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650396726.820, "dur": 4.445, "args": { "External id": 14204,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7699 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650396802.019, "dur": 73.229, "args": { "External id": 14205,"Record function id": 0, "Ev Idx": 7700 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650396876.657, "dur": 1034.978, "args": { "External id": 14206,"Record function id": 0, "Ev Idx": 7701 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650396912.815, "dur": 985.851, "args": { "External id": 14207,"Sequence number": 246584, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7702 } }, { "ph": "s", "id": 184, "pid": 1336759, "tid": 1336759, "ts": 1295650396912.815, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650396976.434, "dur": 74.620, "args": { "External id": 14208,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397067.520, "dur": 103.468, "args": { "External id": 14209,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397179.840, "dur": 41.874, "args": { "External id": 14210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397246.799, "dur": 35.141, "args": { "External id": 14211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7706 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650397309.240, "dur": 24.971, "args": { "External id": 14212,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7707 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650397351.621, "dur": 15.620, "args": { "External id": 14213,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7708 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650397384.649, "dur": 124.358, "args": { "External id": 14214,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650397433.749, "dur": 11.356, "args": { "External id": 14215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650397438.626, "dur": 5.617, "args": { "External id": 14216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650397447.424, "dur": 5.084, "args": { "External id": 14217,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650397453.765, "dur": 1.510, "args": { "External id": 14218,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650397457.848, "dur": 3.074, "args": { "External id": 14219,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397519.907, "dur": 44.318, "args": { "External id": 14220,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7715 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650397593.496, "dur": 26.502, "args": { "External id": 14221,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397627.929, "dur": 40.516, "args": { "External id": 14222,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397676.789, "dur": 33.963, "args": { "External id": 14223,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7718 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650397733.493, "dur": 24.308, "args": { "External id": 14224,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650397763.705, "dur": 33.445, "args": { "External id": 14225,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650397817.284, "dur": 17.604, "args": { "External id": 14226,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7721 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.21)", "pid": 1336759, "tid": 1336759, "ts": 1295650397972.097, "dur": 113.062, "args": { "External id": 14227,"Record function id": 0, "Ev Idx": 7722 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650398161.797, "dur": 47.548, "args": { "External id": 14228,"Record function id": 0, "Ev Idx": 7723 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.22)", "pid": 1336759, "tid": 1336759, "ts": 1295650398218.103, "dur": 18285.285, "args": { "External id": 14229,"Record function id": 0, "Ev Idx": 7724 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336759, "tid": 1336759, "ts": 1295650398225.822, "dur": 904.384, "args": { "External id": 14230,"Record function id": 0, "Ev Idx": 7725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650398320.247, "dur": 8.893, "args": { "External id": 14231,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650398343.076, "dur": 31.501, "args": { "External id": 14232,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398348.354, "dur": 2.281, "args": { "External id": 14233,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398354.557, "dur": 0.520, "args": { "External id": 14234,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398356.149, "dur": 0.573, "args": { "External id": 14235,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398358.025, "dur": 0.602, "args": { "External id": 14236,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398361.257, "dur": 0.398, "args": { "External id": 14237,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398362.750, "dur": 0.738, "args": { "External id": 14238,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398364.195, "dur": 1.444, "args": { "External id": 14239,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398367.133, "dur": 0.515, "args": { "External id": 14240,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398368.587, "dur": 0.484, "args": { "External id": 14241,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650398384.961, "dur": 42.795, "args": { "External id": 14242,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7737 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650398460.894, "dur": 106.666, "args": { "External id": 14243,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650398470.964, "dur": 4.142, "args": { "External id": 14244,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650398479.926, "dur": 10.198, "args": { "External id": 14245,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650398484.507, "dur": 5.236, "args": { "External id": 14246,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398487.847, "dur": 0.722, "args": { "External id": 14247,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650398496.125, "dur": 28.817, "args": { "External id": 14248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398497.816, "dur": 1.880, "args": { "External id": 14249,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398500.938, "dur": 0.439, "args": { "External id": 14250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398502.152, "dur": 0.731, "args": { "External id": 14251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398506.036, "dur": 0.485, "args": { "External id": 14252,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398507.642, "dur": 0.704, "args": { "External id": 14253,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398509.802, "dur": 0.668, "args": { "External id": 14254,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398512.550, "dur": 0.732, "args": { "External id": 14255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398514.492, "dur": 0.799, "args": { "External id": 14256,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650398519.265, "dur": 1.973, "args": { "External id": 14257,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650398536.818, "dur": 23.035, "args": { "External id": 14258,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7753 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650398619.231, "dur": 359.055, "args": { "External id": 14259,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7754 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650398647.620, "dur": 325.207, "args": { "External id": 14260,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7755, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650398657.801, "dur": 309.405, "args": { "External id": 14261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7756 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650399050.620, "dur": 3.299, "args": { "External id": 14262,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7757, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336759, "tid": 1336759, "ts": 1295650399151.518, "dur": 17159.175, "args": { "External id": 14263,"Record function id": 0, "Ev Idx": 7758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399265.754, "dur": 7.308, "args": { "External id": 14264,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399276.898, "dur": 1.196, "args": { "External id": 14265,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399280.086, "dur": 1.284, "args": { "External id": 14266,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399283.023, "dur": 0.852, "args": { "External id": 14267,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399285.377, "dur": 0.984, "args": { "External id": 14268,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399287.589, "dur": 1.041, "args": { "External id": 14269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399292.124, "dur": 1.090, "args": { "External id": 14270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399294.808, "dur": 2.207, "args": { "External id": 14271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399298.288, "dur": 1.025, "args": { "External id": 14272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650399300.867, "dur": 1.124, "args": { "External id": 14273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7768 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650399323.217, "dur": 16947.928, "args": { "External id": 14274,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650399344.183, "dur": 16920.029, "args": { "External id": 14275,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650399364.193, "dur": 13.283, "args": { "External id": 14276,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650399380.059, "dur": 16841.275, "args": { "External id": 14277,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650399382.792, "dur": 16837.975, "args": { "External id": 14278,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650399389.018, "dur": 6.243, "args": { "External id": 14279,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650399397.008, "dur": 16820.815, "args": { "External id": 14280,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7775 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650416443.773, "dur": 34.774, "args": { "External id": 14281,"Sequence number": 246585, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7776 } }, { "ph": "s", "id": 183, "pid": 1336759, "tid": 1336759, "ts": 1295650416443.773, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650416464.916, "dur": 8.195, "args": { "External id": 14282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650416468.234, "dur": 4.593, "args": { "External id": 14283,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7778 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650416541.935, "dur": 73.683, "args": { "External id": 14284,"Record function id": 0, "Ev Idx": 7779 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650416617.163, "dur": 1055.073, "args": { "External id": 14285,"Record function id": 0, "Ev Idx": 7780 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650416654.205, "dur": 1004.584, "args": { "External id": 14286,"Sequence number": 246586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7781 } }, { "ph": "s", "id": 182, "pid": 1336759, "tid": 1336759, "ts": 1295650416654.205, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650416719.853, "dur": 39.906, "args": { "External id": 14287,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650416772.279, "dur": 102.186, "args": { "External id": 14288,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650416883.137, "dur": 37.626, "args": { "External id": 14289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650416929.605, "dur": 31.830, "args": { "External id": 14290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7785 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650417024.446, "dur": 28.248, "args": { "External id": 14291,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7786 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650417072.694, "dur": 15.299, "args": { "External id": 14292,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7787 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650417105.145, "dur": 143.640, "args": { "External id": 14293,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650417156.029, "dur": 12.819, "args": { "External id": 14294,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650417160.783, "dur": 7.278, "args": { "External id": 14295,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650417171.543, "dur": 4.471, "args": { "External id": 14296,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650417177.458, "dur": 1.755, "args": { "External id": 14297,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650417181.398, "dur": 3.565, "args": { "External id": 14298,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650417261.087, "dur": 51.231, "args": { "External id": 14299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7794 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650417344.887, "dur": 26.481, "args": { "External id": 14300,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650417379.608, "dur": 40.722, "args": { "External id": 14301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650417429.823, "dur": 34.676, "args": { "External id": 14302,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7797 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650417486.930, "dur": 27.532, "args": { "External id": 14303,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650417521.172, "dur": 33.960, "args": { "External id": 14304,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7799 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650417576.046, "dur": 16.965, "args": { "External id": 14305,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7800 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.22)", "pid": 1336759, "tid": 1336759, "ts": 1295650417734.050, "dur": 72.400, "args": { "External id": 14306,"Record function id": 0, "Ev Idx": 7801 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650417879.304, "dur": 47.021, "args": { "External id": 14307,"Record function id": 0, "Ev Idx": 7802 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.23)", "pid": 1336759, "tid": 1336759, "ts": 1295650417934.827, "dur": 18206.722, "args": { "External id": 14308,"Record function id": 0, "Ev Idx": 7803 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336759, "tid": 1336759, "ts": 1295650417943.742, "dur": 928.846, "args": { "External id": 14309,"Record function id": 0, "Ev Idx": 7804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650418062.916, "dur": 10.379, "args": { "External id": 14310,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650418087.381, "dur": 34.712, "args": { "External id": 14311,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418092.814, "dur": 2.295, "args": { "External id": 14312,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418099.057, "dur": 0.905, "args": { "External id": 14313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418101.257, "dur": 0.654, "args": { "External id": 14314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418102.943, "dur": 0.416, "args": { "External id": 14315,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418106.837, "dur": 0.553, "args": { "External id": 14316,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418108.584, "dur": 0.636, "args": { "External id": 14317,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418110.414, "dur": 2.088, "args": { "External id": 14318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418113.637, "dur": 0.794, "args": { "External id": 14319,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418115.719, "dur": 0.706, "args": { "External id": 14320,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650418132.075, "dur": 43.094, "args": { "External id": 14321,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7816 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650418208.931, "dur": 159.218, "args": { "External id": 14322,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650418219.156, "dur": 4.412, "args": { "External id": 14323,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650418243.524, "dur": 11.616, "args": { "External id": 14324,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650418248.107, "dur": 6.586, "args": { "External id": 14325,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418252.006, "dur": 0.954, "args": { "External id": 14326,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650418263.241, "dur": 29.972, "args": { "External id": 14327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418265.375, "dur": 2.140, "args": { "External id": 14328,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418268.693, "dur": 0.948, "args": { "External id": 14329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418270.881, "dur": 0.681, "args": { "External id": 14330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418274.930, "dur": 0.994, "args": { "External id": 14331,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418277.117, "dur": 0.873, "args": { "External id": 14332,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418279.447, "dur": 1.083, "args": { "External id": 14333,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418283.575, "dur": 1.203, "args": { "External id": 14334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418285.787, "dur": 0.874, "args": { "External id": 14335,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650418287.744, "dur": 2.013, "args": { "External id": 14336,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650418332.043, "dur": 27.153, "args": { "External id": 14337,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7832 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650418421.822, "dur": 357.170, "args": { "External id": 14338,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7833 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650418450.513, "dur": 323.520, "args": { "External id": 14339,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7834, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650418462.160, "dur": 306.104, "args": { "External id": 14340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7835 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650418802.187, "dur": 2.045, "args": { "External id": 14341,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7836, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336759, "tid": 1336759, "ts": 1295650418891.821, "dur": 17032.809, "args": { "External id": 14342,"Record function id": 0, "Ev Idx": 7837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419021.701, "dur": 6.840, "args": { "External id": 14343,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419033.747, "dur": 1.561, "args": { "External id": 14344,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419037.270, "dur": 1.106, "args": { "External id": 14345,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419039.905, "dur": 1.136, "args": { "External id": 14346,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419042.387, "dur": 0.885, "args": { "External id": 14347,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419046.143, "dur": 1.048, "args": { "External id": 14348,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419048.597, "dur": 0.967, "args": { "External id": 14349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419051.125, "dur": 2.008, "args": { "External id": 14350,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419054.331, "dur": 0.632, "args": { "External id": 14351,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650419057.922, "dur": 0.826, "args": { "External id": 14352,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650419078.054, "dur": 16808.745, "args": { "External id": 14353,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650419093.540, "dur": 16786.472, "args": { "External id": 14354,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650419115.737, "dur": 12.249, "args": { "External id": 14355,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650419131.042, "dur": 16717.831, "args": { "External id": 14356,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650419133.793, "dur": 16714.595, "args": { "External id": 14357,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650419139.918, "dur": 5.773, "args": { "External id": 14358,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650419147.330, "dur": 16698.446, "args": { "External id": 14359,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7854 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650436079.629, "dur": 35.286, "args": { "External id": 14360,"Sequence number": 246587, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7855 } }, { "ph": "s", "id": 181, "pid": 1336759, "tid": 1336759, "ts": 1295650436079.629, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650436102.040, "dur": 7.626, "args": { "External id": 14361,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650436105.191, "dur": 4.118, "args": { "External id": 14362,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7857 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650436179.336, "dur": 88.532, "args": { "External id": 14363,"Record function id": 0, "Ev Idx": 7858 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650436270.959, "dur": 1069.865, "args": { "External id": 14364,"Record function id": 0, "Ev Idx": 7859 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650436312.645, "dur": 1014.803, "args": { "External id": 14365,"Sequence number": 246588, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7860 } }, { "ph": "s", "id": 180, "pid": 1336759, "tid": 1336759, "ts": 1295650436312.645, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650436380.461, "dur": 43.438, "args": { "External id": 14366,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650436436.887, "dur": 104.862, "args": { "External id": 14367,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650436550.576, "dur": 38.417, "args": { "External id": 14368,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650436597.430, "dur": 30.473, "args": { "External id": 14369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7864 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650436653.006, "dur": 26.341, "args": { "External id": 14370,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7865 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650436697.812, "dur": 14.737, "args": { "External id": 14371,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7866 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650436729.303, "dur": 122.257, "args": { "External id": 14372,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650436777.314, "dur": 11.394, "args": { "External id": 14373,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650436782.279, "dur": 5.649, "args": { "External id": 14374,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650436791.463, "dur": 4.301, "args": { "External id": 14375,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650436797.414, "dur": 1.200, "args": { "External id": 14376,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650436801.027, "dur": 3.213, "args": { "External id": 14377,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650436861.650, "dur": 44.288, "args": { "External id": 14378,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7873 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650436936.040, "dur": 27.187, "args": { "External id": 14379,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650436971.746, "dur": 86.204, "args": { "External id": 14380,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650437070.696, "dur": 37.082, "args": { "External id": 14381,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7876 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650437138.216, "dur": 25.465, "args": { "External id": 14382,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650437169.388, "dur": 33.742, "args": { "External id": 14383,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650437224.197, "dur": 33.513, "args": { "External id": 14384,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7879 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.23)", "pid": 1336759, "tid": 1336759, "ts": 1295650437405.027, "dur": 74.698, "args": { "External id": 14385,"Record function id": 0, "Ev Idx": 7880 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650437554.793, "dur": 46.796, "args": { "External id": 14386,"Record function id": 0, "Ev Idx": 7881 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.24)", "pid": 1336759, "tid": 1336759, "ts": 1295650437610.895, "dur": 18229.039, "args": { "External id": 14387,"Record function id": 0, "Ev Idx": 7882 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336759, "tid": 1336759, "ts": 1295650437619.561, "dur": 875.631, "args": { "External id": 14388,"Record function id": 0, "Ev Idx": 7883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650437698.203, "dur": 8.324, "args": { "External id": 14389,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650437719.300, "dur": 35.311, "args": { "External id": 14390,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437725.075, "dur": 2.226, "args": { "External id": 14391,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437730.830, "dur": 0.977, "args": { "External id": 14392,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437733.349, "dur": 0.782, "args": { "External id": 14393,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437735.111, "dur": 0.803, "args": { "External id": 14394,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437739.379, "dur": 0.642, "args": { "External id": 14395,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437740.938, "dur": 0.928, "args": { "External id": 14396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437743.147, "dur": 1.823, "args": { "External id": 14397,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437746.267, "dur": 0.816, "args": { "External id": 14398,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437748.394, "dur": 0.695, "args": { "External id": 14399,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650437765.151, "dur": 37.115, "args": { "External id": 14400,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7895 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650437834.708, "dur": 104.487, "args": { "External id": 14401,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650437844.795, "dur": 4.380, "args": { "External id": 14402,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650437853.951, "dur": 9.972, "args": { "External id": 14403,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650437858.380, "dur": 5.113, "args": { "External id": 14404,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437861.616, "dur": 0.629, "args": { "External id": 14405,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650437870.200, "dur": 28.941, "args": { "External id": 14406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437871.881, "dur": 2.709, "args": { "External id": 14407,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437875.940, "dur": 0.948, "args": { "External id": 14408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437878.311, "dur": 0.665, "args": { "External id": 14409,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437882.439, "dur": 0.371, "args": { "External id": 14410,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437884.186, "dur": 0.546, "args": { "External id": 14411,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437886.167, "dur": 0.611, "args": { "External id": 14412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437889.673, "dur": 0.865, "args": { "External id": 14413,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437891.386, "dur": 0.829, "args": { "External id": 14414,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650437893.544, "dur": 1.974, "args": { "External id": 14415,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650437910.945, "dur": 20.620, "args": { "External id": 14416,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7911 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650438028.999, "dur": 368.267, "args": { "External id": 14417,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7912 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650438061.463, "dur": 330.748, "args": { "External id": 14418,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7913, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650438073.001, "dur": 312.744, "args": { "External id": 14419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7914 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650438421.059, "dur": 2.100, "args": { "External id": 14420,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7915, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336759, "tid": 1336759, "ts": 1295650438515.561, "dur": 17135.750, "args": { "External id": 14421,"Record function id": 0, "Ev Idx": 7916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438611.213, "dur": 6.493, "args": { "External id": 14422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438625.433, "dur": 1.572, "args": { "External id": 14423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438629.003, "dur": 1.040, "args": { "External id": 14424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438633.064, "dur": 0.945, "args": { "External id": 14425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438635.230, "dur": 1.017, "args": { "External id": 14426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438637.574, "dur": 0.881, "args": { "External id": 14427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438640.330, "dur": 0.808, "args": { "External id": 14428,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438643.763, "dur": 2.187, "args": { "External id": 14429,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438647.789, "dur": 0.684, "args": { "External id": 14430,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650438649.870, "dur": 1.215, "args": { "External id": 14431,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7926 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650438669.982, "dur": 16942.249, "args": { "External id": 14432,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650438685.747, "dur": 16919.744, "args": { "External id": 14433,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650438705.773, "dur": 13.556, "args": { "External id": 14434,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650438724.297, "dur": 16849.978, "args": { "External id": 14435,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650438726.659, "dur": 16846.878, "args": { "External id": 14436,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650438731.827, "dur": 6.019, "args": { "External id": 14437,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650438739.322, "dur": 16831.212, "args": { "External id": 14438,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7933 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650455781.485, "dur": 34.668, "args": { "External id": 14439,"Sequence number": 246589, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7934 } }, { "ph": "s", "id": 179, "pid": 1336759, "tid": 1336759, "ts": 1295650455781.485, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650455803.500, "dur": 7.713, "args": { "External id": 14440,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650455806.521, "dur": 4.452, "args": { "External id": 14441,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7936 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650455878.863, "dur": 72.534, "args": { "External id": 14442,"Record function id": 0, "Ev Idx": 7937 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650455952.714, "dur": 1017.562, "args": { "External id": 14443,"Record function id": 0, "Ev Idx": 7938 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650456023.374, "dur": 934.278, "args": { "External id": 14444,"Sequence number": 246590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7939 } }, { "ph": "s", "id": 178, "pid": 1336759, "tid": 1336759, "ts": 1295650456023.374, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650456092.314, "dur": 42.947, "args": { "External id": 14445,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456148.522, "dur": 105.699, "args": { "External id": 14446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456266.568, "dur": 40.195, "args": { "External id": 14447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456316.315, "dur": 30.581, "args": { "External id": 14448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7943 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650456373.139, "dur": 24.777, "args": { "External id": 14449,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7944 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650456414.853, "dur": 15.017, "args": { "External id": 14450,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7945 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650456447.562, "dur": 123.551, "args": { "External id": 14451,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650456496.508, "dur": 11.425, "args": { "External id": 14452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650456501.239, "dur": 5.842, "args": { "External id": 14453,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650456510.472, "dur": 5.034, "args": { "External id": 14454,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650456516.715, "dur": 1.609, "args": { "External id": 14455,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650456520.954, "dur": 3.150, "args": { "External id": 14456,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456580.997, "dur": 43.010, "args": { "External id": 14457,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7952 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650456653.201, "dur": 24.810, "args": { "External id": 14458,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456685.410, "dur": 39.137, "args": { "External id": 14459,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456732.692, "dur": 33.796, "args": { "External id": 14460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650456796.011, "dur": 25.371, "args": { "External id": 14461,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650456829.207, "dur": 33.666, "args": { "External id": 14462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650456880.875, "dur": 16.096, "args": { "External id": 14463,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7958 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.24)", "pid": 1336759, "tid": 1336759, "ts": 1295650457071.856, "dur": 70.906, "args": { "External id": 14464,"Record function id": 0, "Ev Idx": 7959 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650457215.636, "dur": 65.876, "args": { "External id": 14465,"Record function id": 0, "Ev Idx": 7960 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.25)", "pid": 1336759, "tid": 1336759, "ts": 1295650457291.607, "dur": 18227.593, "args": { "External id": 14466,"Record function id": 0, "Ev Idx": 7961 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336759, "tid": 1336759, "ts": 1295650457301.002, "dur": 905.236, "args": { "External id": 14467,"Record function id": 0, "Ev Idx": 7962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650457378.102, "dur": 8.861, "args": { "External id": 14468,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650457399.805, "dur": 33.607, "args": { "External id": 14469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457404.765, "dur": 2.124, "args": { "External id": 14470,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457411.101, "dur": 1.041, "args": { "External id": 14471,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457413.182, "dur": 0.718, "args": { "External id": 14472,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457415.491, "dur": 0.718, "args": { "External id": 14473,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457418.722, "dur": 0.488, "args": { "External id": 14474,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457420.567, "dur": 0.628, "args": { "External id": 14475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457422.531, "dur": 1.865, "args": { "External id": 14476,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457425.840, "dur": 0.704, "args": { "External id": 14477,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457427.488, "dur": 0.663, "args": { "External id": 14478,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650457444.044, "dur": 39.189, "args": { "External id": 14479,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7974 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650457515.102, "dur": 106.059, "args": { "External id": 14480,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650457525.477, "dur": 4.719, "args": { "External id": 14481,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650457534.691, "dur": 10.119, "args": { "External id": 14482,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650457538.923, "dur": 5.500, "args": { "External id": 14483,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457542.259, "dur": 1.031, "args": { "External id": 14484,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650457551.278, "dur": 27.675, "args": { "External id": 14485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457553.054, "dur": 2.314, "args": { "External id": 14486,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457557.365, "dur": 1.153, "args": { "External id": 14487,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457559.749, "dur": 0.429, "args": { "External id": 14488,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457563.763, "dur": 0.697, "args": { "External id": 14489,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457565.454, "dur": 0.486, "args": { "External id": 14490,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457567.123, "dur": 0.406, "args": { "External id": 14491,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457569.884, "dur": 0.551, "args": { "External id": 14492,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457571.808, "dur": 0.641, "args": { "External id": 14493,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650457573.534, "dur": 1.683, "args": { "External id": 14494,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650457591.711, "dur": 21.793, "args": { "External id": 14495,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7990 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650457671.421, "dur": 431.559, "args": { "External id": 14496,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7991 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650457699.260, "dur": 397.963, "args": { "External id": 14497,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7992, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650457709.473, "dur": 381.091, "args": { "External id": 14498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650458127.876, "dur": 2.224, "args": { "External id": 14499,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7994, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336759, "tid": 1336759, "ts": 1295650458226.758, "dur": 17102.242, "args": { "External id": 14500,"Record function id": 0, "Ev Idx": 7995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458346.782, "dur": 6.950, "args": { "External id": 14501,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458357.129, "dur": 1.486, "args": { "External id": 14502,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458360.251, "dur": 1.123, "args": { "External id": 14503,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458362.855, "dur": 1.061, "args": { "External id": 14504,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458365.408, "dur": 1.128, "args": { "External id": 14505,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458367.727, "dur": 1.181, "args": { "External id": 14506,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458372.124, "dur": 1.038, "args": { "External id": 14507,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458374.650, "dur": 1.975, "args": { "External id": 14508,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458378.159, "dur": 0.892, "args": { "External id": 14509,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650458380.580, "dur": 0.852, "args": { "External id": 14510,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8005 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650458402.093, "dur": 16888.639, "args": { "External id": 14511,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650458417.344, "dur": 16866.855, "args": { "External id": 14512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650458440.671, "dur": 12.879, "args": { "External id": 14513,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650458456.801, "dur": 16796.496, "args": { "External id": 14514,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650458459.343, "dur": 16793.424, "args": { "External id": 14515,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650458464.674, "dur": 5.778, "args": { "External id": 14516,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650458472.299, "dur": 16777.521, "args": { "External id": 14517,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8012 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650475460.657, "dur": 33.578, "args": { "External id": 14518,"Sequence number": 246591, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8013 } }, { "ph": "s", "id": 177, "pid": 1336759, "tid": 1336759, "ts": 1295650475460.657, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650475475.894, "dur": 13.250, "args": { "External id": 14519,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650475484.642, "dur": 4.280, "args": { "External id": 14520,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8015 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650475556.745, "dur": 74.978, "args": { "External id": 14521,"Record function id": 0, "Ev Idx": 8016 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650475632.997, "dur": 1034.124, "args": { "External id": 14522,"Record function id": 0, "Ev Idx": 8017 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650475672.434, "dur": 981.568, "args": { "External id": 14523,"Sequence number": 246592, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8018 } }, { "ph": "s", "id": 176, "pid": 1336759, "tid": 1336759, "ts": 1295650475672.434, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650475736.264, "dur": 39.129, "args": { "External id": 14524,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650475787.987, "dur": 100.573, "args": { "External id": 14525,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650475897.105, "dur": 36.271, "args": { "External id": 14526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650475941.750, "dur": 30.757, "args": { "External id": 14527,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8022 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650476035.940, "dur": 28.042, "args": { "External id": 14528,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8023 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650476082.738, "dur": 14.143, "args": { "External id": 14529,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8024 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650476113.592, "dur": 137.951, "args": { "External id": 14530,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650476161.461, "dur": 12.577, "args": { "External id": 14531,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650476166.213, "dur": 6.976, "args": { "External id": 14532,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650476176.462, "dur": 4.294, "args": { "External id": 14533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650476181.948, "dur": 1.612, "args": { "External id": 14534,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650476186.215, "dur": 3.493, "args": { "External id": 14535,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650476263.393, "dur": 51.232, "args": { "External id": 14536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8031 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650476346.063, "dur": 27.486, "args": { "External id": 14537,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650476381.289, "dur": 39.917, "args": { "External id": 14538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650476429.194, "dur": 33.752, "args": { "External id": 14539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8034 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650476485.019, "dur": 29.013, "args": { "External id": 14540,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650476519.987, "dur": 32.960, "args": { "External id": 14541,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8036 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650476571.150, "dur": 17.057, "args": { "External id": 14542,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8037 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.25)", "pid": 1336759, "tid": 1336759, "ts": 1295650476728.957, "dur": 71.862, "args": { "External id": 14543,"Record function id": 0, "Ev Idx": 8038 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650476873.141, "dur": 48.523, "args": { "External id": 14544,"Record function id": 0, "Ev Idx": 8039 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.26)", "pid": 1336759, "tid": 1336759, "ts": 1295650476930.573, "dur": 18467.016, "args": { "External id": 14545,"Record function id": 0, "Ev Idx": 8040 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336759, "tid": 1336759, "ts": 1295650476939.938, "dur": 868.929, "args": { "External id": 14546,"Record function id": 0, "Ev Idx": 8041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650477058.846, "dur": 9.290, "args": { "External id": 14547,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650477082.741, "dur": 34.954, "args": { "External id": 14548,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477088.401, "dur": 2.302, "args": { "External id": 14549,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477094.716, "dur": 0.658, "args": { "External id": 14550,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477096.614, "dur": 0.582, "args": { "External id": 14551,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477098.648, "dur": 0.745, "args": { "External id": 14552,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477102.306, "dur": 0.636, "args": { "External id": 14553,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477104.339, "dur": 0.577, "args": { "External id": 14554,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477106.055, "dur": 2.134, "args": { "External id": 14555,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477109.379, "dur": 0.623, "args": { "External id": 14556,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477111.334, "dur": 0.436, "args": { "External id": 14557,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650477127.708, "dur": 39.940, "args": { "External id": 14558,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8053 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650477200.447, "dur": 130.500, "args": { "External id": 14559,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650477210.706, "dur": 4.417, "args": { "External id": 14560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650477219.736, "dur": 26.517, "args": { "External id": 14561,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650477224.185, "dur": 21.649, "args": { "External id": 14562,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477242.729, "dur": 0.980, "args": { "External id": 14563,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650477254.902, "dur": 30.968, "args": { "External id": 14564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477256.909, "dur": 2.427, "args": { "External id": 14565,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477260.673, "dur": 0.603, "args": { "External id": 14566,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477265.927, "dur": 0.635, "args": { "External id": 14567,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477269.481, "dur": 0.694, "args": { "External id": 14568,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477271.243, "dur": 0.673, "args": { "External id": 14569,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477273.293, "dur": 1.820, "args": { "External id": 14570,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477276.309, "dur": 0.422, "args": { "External id": 14571,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477277.939, "dur": 0.632, "args": { "External id": 14572,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650477281.571, "dur": 0.669, "args": { "External id": 14573,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650477298.097, "dur": 24.476, "args": { "External id": 14574,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8069 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650477384.494, "dur": 339.609, "args": { "External id": 14575,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8070 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650477413.930, "dur": 305.278, "args": { "External id": 14576,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8071, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650477423.890, "dur": 289.742, "args": { "External id": 14577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8072 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650477743.981, "dur": 1.846, "args": { "External id": 14578,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8073, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336759, "tid": 1336759, "ts": 1295650477828.869, "dur": 17366.268, "args": { "External id": 14579,"Record function id": 0, "Ev Idx": 8074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477918.829, "dur": 5.598, "args": { "External id": 14580,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477927.840, "dur": 1.273, "args": { "External id": 14581,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477935.104, "dur": 0.940, "args": { "External id": 14582,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477938.938, "dur": 1.067, "args": { "External id": 14583,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477941.228, "dur": 0.807, "args": { "External id": 14584,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477943.543, "dur": 0.823, "args": { "External id": 14585,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477945.898, "dur": 0.764, "args": { "External id": 14586,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477949.914, "dur": 1.905, "args": { "External id": 14587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477953.008, "dur": 0.867, "args": { "External id": 14588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650477955.374, "dur": 0.779, "args": { "External id": 14589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8084 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650477975.151, "dur": 17181.823, "args": { "External id": 14590,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650478029.250, "dur": 17121.399, "args": { "External id": 14591,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650478049.370, "dur": 13.059, "args": { "External id": 14592,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650478066.992, "dur": 17053.854, "args": { "External id": 14593,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650478069.449, "dur": 17050.916, "args": { "External id": 14594,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650478075.056, "dur": 5.826, "args": { "External id": 14595,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650478082.545, "dur": 17034.980, "args": { "External id": 14596,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8091 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650495338.840, "dur": 34.116, "args": { "External id": 14597,"Sequence number": 246593, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8092 } }, { "ph": "s", "id": 175, "pid": 1336759, "tid": 1336759, "ts": 1295650495338.840, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650495354.479, "dur": 13.730, "args": { "External id": 14598,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650495363.311, "dur": 4.501, "args": { "External id": 14599,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8094 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650495434.983, "dur": 72.526, "args": { "External id": 14600,"Record function id": 0, "Ev Idx": 8095 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650495509.296, "dur": 1060.477, "args": { "External id": 14601,"Record function id": 0, "Ev Idx": 8096 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650495547.370, "dur": 1009.067, "args": { "External id": 14602,"Sequence number": 246594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8097 } }, { "ph": "s", "id": 174, "pid": 1336759, "tid": 1336759, "ts": 1295650495547.370, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650495617.850, "dur": 38.895, "args": { "External id": 14603,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650495669.173, "dur": 101.475, "args": { "External id": 14604,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650495779.181, "dur": 37.887, "args": { "External id": 14605,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650495824.989, "dur": 30.759, "args": { "External id": 14606,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8101 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650495878.315, "dur": 24.735, "args": { "External id": 14607,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8102 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650495921.221, "dur": 14.704, "args": { "External id": 14608,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8103 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650495951.710, "dur": 166.709, "args": { "External id": 14609,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650496040.191, "dur": 12.674, "args": { "External id": 14610,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496045.212, "dur": 6.679, "args": { "External id": 14611,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650496055.392, "dur": 4.365, "args": { "External id": 14612,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650496061.044, "dur": 1.331, "args": { "External id": 14613,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650496064.711, "dur": 3.573, "args": { "External id": 14614,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650496129.042, "dur": 48.408, "args": { "External id": 14615,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8110 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650496208.390, "dur": 41.201, "args": { "External id": 14616,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650496260.787, "dur": 53.894, "args": { "External id": 14617,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650496325.937, "dur": 36.727, "args": { "External id": 14618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8113 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650496384.901, "dur": 25.013, "args": { "External id": 14619,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650496415.926, "dur": 33.919, "args": { "External id": 14620,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8115 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650496470.698, "dur": 18.762, "args": { "External id": 14621,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8116 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.26)", "pid": 1336759, "tid": 1336759, "ts": 1295650496631.352, "dur": 71.091, "args": { "External id": 14622,"Record function id": 0, "Ev Idx": 8117 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336759, "tid": 1336759, "ts": 1295650496775.463, "dur": 45.324, "args": { "External id": 14623,"Record function id": 0, "Ev Idx": 8118 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.27)", "pid": 1336759, "tid": 1336759, "ts": 1295650496829.368, "dur": 18397.327, "args": { "External id": 14624,"Record function id": 0, "Ev Idx": 8119 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.27)", "pid": 1336759, "tid": 1336759, "ts": 1295650496836.882, "dur": 869.827, "args": { "External id": 14625,"Record function id": 0, "Ev Idx": 8120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650496913.610, "dur": 8.280, "args": { "External id": 14626,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650496934.740, "dur": 33.593, "args": { "External id": 14627,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496939.660, "dur": 2.167, "args": { "External id": 14628,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496946.195, "dur": 0.422, "args": { "External id": 14629,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496947.633, "dur": 0.804, "args": { "External id": 14630,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496950.151, "dur": 0.743, "args": { "External id": 14631,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496953.466, "dur": 0.722, "args": { "External id": 14632,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496955.605, "dur": 0.665, "args": { "External id": 14633,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496957.421, "dur": 2.386, "args": { "External id": 14634,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496961.115, "dur": 0.492, "args": { "External id": 14635,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650496962.341, "dur": 0.622, "args": { "External id": 14636,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650496978.070, "dur": 83.537, "args": { "External id": 14637,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336759, "tid": 1336759, "ts": 1295650497097.765, "dur": 111.158, "args": { "External id": 14638,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "6", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650497109.096, "dur": 4.725, "args": { "External id": 14639,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336759, "tid": 1336759, "ts": 1295650497118.437, "dur": 10.971, "args": { "External id": 14640,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650497122.938, "dur": 6.031, "args": { "External id": 14641,"Record function id": 0, "Concrete Inputs": ["", "0", "38538240", "44961280", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497126.620, "dur": 0.896, "args": { "External id": 14642,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336759, "tid": 1336759, "ts": 1295650497137.058, "dur": 27.411, "args": { "External id": 14643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497138.883, "dur": 1.936, "args": { "External id": 14644,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "38538240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497142.390, "dur": 0.534, "args": { "External id": 14645,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "38538496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497143.975, "dur": 0.594, "args": { "External id": 14646,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39062784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497147.789, "dur": 0.468, "args": { "External id": 14647,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "39587072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497149.185, "dur": 0.791, "args": { "External id": 14648,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "40111360"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497151.574, "dur": 0.517, "args": { "External id": 14649,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "40635648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497154.644, "dur": 0.730, "args": { "External id": 14650,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "40635904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497156.943, "dur": 0.600, "args": { "External id": 14651,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "42077696"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497158.559, "dur": 1.939, "args": { "External id": 14652,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "43519488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650497179.075, "dur": 22.102, "args": { "External id": 14653,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8148 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336759, "tid": 1336759, "ts": 1295650497281.271, "dur": 338.481, "args": { "External id": 14654,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8149 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650497309.511, "dur": 305.610, "args": { "External id": 14655,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 6, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8150, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336759, "tid": 1336759, "ts": 1295650497320.208, "dur": 289.829, "args": { "External id": 14656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8151 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295650497640.291, "dur": 2.321, "args": { "External id": 14657,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8152, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.27)", "pid": 1336759, "tid": 1336759, "ts": 1295650497725.228, "dur": 17307.322, "args": { "External id": 14658,"Record function id": 0, "Ev Idx": 8153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497828.202, "dur": 6.049, "args": { "External id": 14659,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497837.551, "dur": 1.389, "args": { "External id": 14660,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497840.584, "dur": 0.847, "args": { "External id": 14661,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497844.791, "dur": 1.024, "args": { "External id": 14662,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497847.186, "dur": 1.014, "args": { "External id": 14663,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497849.422, "dur": 0.937, "args": { "External id": 14664,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497851.897, "dur": 0.905, "args": { "External id": 14665,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497856.190, "dur": 1.713, "args": { "External id": 14666,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497859.438, "dur": 0.809, "args": { "External id": 14667,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650497861.763, "dur": 0.696, "args": { "External id": 14668,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8163 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650497880.686, "dur": 17077.457, "args": { "External id": 14669,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650497895.288, "dur": 17056.273, "args": { "External id": 14670,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650497913.942, "dur": 17.344, "args": { "External id": 14671,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650497935.813, "dur": 16985.010, "args": { "External id": 14672,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650497938.233, "dur": 16981.989, "args": { "External id": 14673,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650497943.814, "dur": 5.191, "args": { "External id": 14674,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650497950.638, "dur": 16966.464, "args": { "External id": 14675,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8170 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650515167.045, "dur": 36.518, "args": { "External id": 14676,"Sequence number": 246595, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8171 } }, { "ph": "s", "id": 173, "pid": 1336759, "tid": 1336759, "ts": 1295650515167.045, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295650515185.004, "dur": 13.732, "args": { "External id": 14677,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650515193.660, "dur": 4.750, "args": { "External id": 14678,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8173 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650515276.270, "dur": 74.962, "args": { "External id": 14679,"Record function id": 0, "Ev Idx": 8174 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336759, "tid": 1336759, "ts": 1295650515353.079, "dur": 1055.286, "args": { "External id": 14680,"Record function id": 0, "Ev Idx": 8175 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650515391.859, "dur": 1003.497, "args": { "External id": 14681,"Sequence number": 246596, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8176 } }, { "ph": "s", "id": 172, "pid": 1336759, "tid": 1336759, "ts": 1295650515391.859, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650515459.023, "dur": 42.140, "args": { "External id": 14682,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650515514.068, "dur": 105.634, "args": { "External id": 14683,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650515627.960, "dur": 38.723, "args": { "External id": 14684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650515674.988, "dur": 30.755, "args": { "External id": 14685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8180 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650515728.953, "dur": 24.152, "args": { "External id": 14686,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8181 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336759, "tid": 1336759, "ts": 1295650515771.828, "dur": 14.089, "args": { "External id": 14687,"kernel_hash": "c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/5n/c5nleexjfe7ckjbhvsxfsribge47peqkyivjpkls2h4yztzme4px.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8182 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650515803.049, "dur": 122.300, "args": { "External id": 14688,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650515852.620, "dur": 11.806, "args": { "External id": 14689,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650515857.513, "dur": 6.172, "args": { "External id": 14690,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650515866.803, "dur": 4.193, "args": { "External id": 14691,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650515872.098, "dur": 1.832, "args": { "External id": 14692,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650515876.197, "dur": 2.734, "args": { "External id": 14693,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650515935.071, "dur": 44.720, "args": { "External id": 14694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8189 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336759, "tid": 1336759, "ts": 1295650516056.259, "dur": 29.871, "args": { "External id": 14695,"kernel_hash": "c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/3l/c3la5vptoeqypxfxfvfv4bdw7i4xiukijyga2gm6nuqgqnu7xukn.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650516095.293, "dur": 44.378, "args": { "External id": 14696,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650516148.487, "dur": 34.213, "args": { "External id": 14697,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336759, "tid": 1336759, "ts": 1295650516203.226, "dur": 38.391, "args": { "External id": 14698,"kernel_hash": "ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/kq/ckqncfcfp3lv2zt52bvm43teupuhix6t4d4srlqovp6jq4mh7ayg.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650516249.695, "dur": 38.803, "args": { "External id": 14699,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336759, "tid": 1336759, "ts": 1295650516310.922, "dur": 18.546, "args": { "External id": 14700,"kernel_hash": "cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/u6/cu627l3x7nht56wplsa2rqn4a3r4dce6couhabvxwttkx3auhd6p.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.27)", "pid": 1336759, "tid": 1336759, "ts": 1295650516471.057, "dur": 33.779, "args": { "External id": 14701,"Record function id": 0, "Ev Idx": 8196 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650516638.321, "dur": 265.258, "args": { "External id": 14702,"Sequence number": 246597, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8197 } }, { "ph": "s", "id": 171, "pid": 1336759, "tid": 1336759, "ts": 1295650516638.321, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650516670.296, "dur": 8.933, "args": { "External id": 14703,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650516673.080, "dur": 5.872, "args": { "External id": 14704,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650516689.159, "dur": 11.686, "args": { "External id": 14705,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650516692.364, "dur": 7.833, "args": { "External id": 14706,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650516709.443, "dur": 5.289, "args": { "External id": 14707,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650516886.196, "dur": 5.638, "args": { "External id": 14708,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650516889.154, "dur": 2.477, "args": { "External id": 14709,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650516930.312, "dur": 176.366, "args": { "External id": 14710,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650516934.011, "dur": 15.828, "args": { "External id": 14711,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8206 } }, { "ph": "s", "id": 170, "pid": 1336759, "tid": 1336759, "ts": 1295650516934.011, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650516940.045, "dur": 8.261, "args": { "External id": 14712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650516945.946, "dur": 1.975, "args": { "External id": 14713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650516952.279, "dur": 154.042, "args": { "External id": 14714,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650516955.767, "dur": 4.887, "args": { "External id": 14715,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650516956.560, "dur": 3.948, "args": { "External id": 14716,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8211 } }, { "ph": "s", "id": 169, "pid": 1336759, "tid": 1336759, "ts": 1295650516956.560, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650516964.999, "dur": 129.658, "args": { "External id": 14717,"Sequence number": 246600, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8212 } }, { "ph": "s", "id": 168, "pid": 1336759, "tid": 1336759, "ts": 1295650516964.999, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650517099.256, "dur": 5.909, "args": { "External id": 14718,"Sequence number": 246601, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8213 } }, { "ph": "s", "id": 167, "pid": 1336759, "tid": 1336759, "ts": 1295650517099.256, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650517118.739, "dur": 71.443, "args": { "External id": 14719,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650517120.197, "dur": 8.663, "args": { "External id": 14720,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8215 } }, { "ph": "s", "id": 166, "pid": 1336759, "tid": 1336759, "ts": 1295650517120.197, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650517122.647, "dur": 5.110, "args": { "External id": 14721,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517126.319, "dur": 1.177, "args": { "External id": 14722,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650517129.724, "dur": 60.160, "args": { "External id": 14723,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517130.732, "dur": 5.491, "args": { "External id": 14724,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517131.650, "dur": 4.411, "args": { "External id": 14725,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8220 } }, { "ph": "s", "id": 165, "pid": 1336759, "tid": 1336759, "ts": 1295650517131.650, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650517136.929, "dur": 46.718, "args": { "External id": 14726,"Sequence number": 246604, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8221 } }, { "ph": "s", "id": 164, "pid": 1336759, "tid": 1336759, "ts": 1295650517136.929, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650517185.311, "dur": 4.146, "args": { "External id": 14727,"Sequence number": 246605, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8222 } }, { "ph": "s", "id": 163, "pid": 1336759, "tid": 1336759, "ts": 1295650517185.311, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650517197.646, "dur": 83.724, "args": { "External id": 14728,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650517198.217, "dur": 5.046, "args": { "External id": 14729,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8224 } }, { "ph": "s", "id": 162, "pid": 1336759, "tid": 1336759, "ts": 1295650517198.217, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650517199.779, "dur": 2.376, "args": { "External id": 14730,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517201.210, "dur": 0.794, "args": { "External id": 14731,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650517205.696, "dur": 75.498, "args": { "External id": 14732,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517206.926, "dur": 4.395, "args": { "External id": 14733,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517207.771, "dur": 3.411, "args": { "External id": 14734,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8229 } }, { "ph": "s", "id": 161, "pid": 1336759, "tid": 1336759, "ts": 1295650517207.771, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650517211.935, "dur": 59.835, "args": { "External id": 14735,"Sequence number": 246608, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8230 } }, { "ph": "s", "id": 160, "pid": 1336759, "tid": 1336759, "ts": 1295650517211.935, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650517274.389, "dur": 6.199, "args": { "External id": 14736,"Sequence number": 246609, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8231 } }, { "ph": "s", "id": 159, "pid": 1336759, "tid": 1336759, "ts": 1295650517274.389, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517305.440, "dur": 3.981, "args": { "External id": 14737,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517306.187, "dur": 3.096, "args": { "External id": 14738,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8233 } }, { "ph": "s", "id": 158, "pid": 1336759, "tid": 1336759, "ts": 1295650517306.187, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517316.097, "dur": 3.034, "args": { "External id": 14739,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517317.054, "dur": 1.951, "args": { "External id": 14740,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8235 } }, { "ph": "s", "id": 157, "pid": 1336759, "tid": 1336759, "ts": 1295650517317.054, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517325.216, "dur": 4.967, "args": { "External id": 14741,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517326.059, "dur": 3.990, "args": { "External id": 14742,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8237 } }, { "ph": "s", "id": 156, "pid": 1336759, "tid": 1336759, "ts": 1295650517326.059, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650517366.747, "dur": 180.821, "args": { "External id": 14743,"Sequence number": 246613, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8238 } }, { "ph": "s", "id": 155, "pid": 1336759, "tid": 1336759, "ts": 1295650517366.747, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650517390.030, "dur": 9.851, "args": { "External id": 14744,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517393.093, "dur": 6.275, "args": { "External id": 14745,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8240 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650517560.645, "dur": 108.452, "args": { "External id": 14746,"Sequence number": 246614, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8241 } }, { "ph": "s", "id": 154, "pid": 1336759, "tid": 1336759, "ts": 1295650517560.645, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650517575.262, "dur": 6.419, "args": { "External id": 14747,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517577.386, "dur": 3.834, "args": { "External id": 14748,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8243 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336759, "tid": 1336759, "ts": 1295650517699.020, "dur": 172.931, "args": { "External id": 14749,"Sequence number": 246615, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8244 } }, { "ph": "s", "id": 153, "pid": 1336759, "tid": 1336759, "ts": 1295650517699.020, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650517727.755, "dur": 116.701, "args": { "External id": 14750,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650517774.449, "dur": 6.597, "args": { "External id": 14751,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517776.788, "dur": 3.774, "args": { "External id": 14752,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650517783.777, "dur": 4.093, "args": { "External id": 14753,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650517789.051, "dur": 1.601, "args": { "External id": 14754,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650517794.926, "dur": 2.788, "args": { "External id": 14755,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1336759, "ts": 1295650517858.423, "dur": 4.724, "args": { "External id": 14756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517876.807, "dur": 5.443, "args": { "External id": 14757,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517878.269, "dur": 3.858, "args": { "External id": 14758,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8253 } }, { "ph": "s", "id": 152, "pid": 1336759, "tid": 1336759, "ts": 1295650517878.269, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650517897.701, "dur": 167.840, "args": { "External id": 14759,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650517900.705, "dur": 8.551, "args": { "External id": 14760,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8255 } }, { "ph": "s", "id": 151, "pid": 1336759, "tid": 1336759, "ts": 1295650517900.705, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650517903.527, "dur": 4.664, "args": { "External id": 14761,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650517906.290, "dur": 1.662, "args": { "External id": 14762,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650517910.510, "dur": 154.683, "args": { "External id": 14763,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650517912.103, "dur": 9.051, "args": { "External id": 14764,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650517915.277, "dur": 5.659, "args": { "External id": 14765,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8260 } }, { "ph": "s", "id": 150, "pid": 1336759, "tid": 1336759, "ts": 1295650517915.277, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650517922.194, "dur": 132.494, "args": { "External id": 14766,"Sequence number": 246619, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8261 } }, { "ph": "s", "id": 149, "pid": 1336759, "tid": 1336759, "ts": 1295650517922.194, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650518058.315, "dur": 5.979, "args": { "External id": 14767,"Sequence number": 246620, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8262 } }, { "ph": "s", "id": 148, "pid": 1336759, "tid": 1336759, "ts": 1295650518058.315, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650518104.168, "dur": 254.489, "args": { "External id": 14768,"Sequence number": 246621, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8263 } }, { "ph": "s", "id": 147, "pid": 1336759, "tid": 1336759, "ts": 1295650518104.168, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518126.251, "dur": 3.203, "args": { "External id": 14769,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518127.094, "dur": 2.038, "args": { "External id": 14770,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336759, "tid": 1336759, "ts": 1295650518135.360, "dur": 3.271, "args": { "External id": 14771,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518136.278, "dur": 2.248, "args": { "External id": 14772,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518137.206, "dur": 1.208, "args": { "External id": 14773,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650518146.340, "dur": 9.983, "args": { "External id": 14774,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650518150.159, "dur": 5.824, "args": { "External id": 14775,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650518162.602, "dur": 3.341, "args": { "External id": 14776,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650518169.548, "dur": 2.852, "args": { "External id": 14777,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518331.833, "dur": 4.496, "args": { "External id": 14778,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518333.038, "dur": 2.938, "args": { "External id": 14779,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518338.879, "dur": 2.125, "args": { "External id": 14780,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518339.872, "dur": 0.977, "args": { "External id": 14781,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650518379.986, "dur": 101.868, "args": { "External id": 14782,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650518381.234, "dur": 7.868, "args": { "External id": 14783,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8278 } }, { "ph": "s", "id": 146, "pid": 1336759, "tid": 1336759, "ts": 1295650518381.234, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650518383.677, "dur": 4.149, "args": { "External id": 14784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650518385.851, "dur": 1.552, "args": { "External id": 14785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650518390.078, "dur": 91.426, "args": { "External id": 14786,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518393.372, "dur": 3.509, "args": { "External id": 14787,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518394.081, "dur": 2.669, "args": { "External id": 14788,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8283 } }, { "ph": "s", "id": 145, "pid": 1336759, "tid": 1336759, "ts": 1295650518394.081, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650518397.912, "dur": 77.815, "args": { "External id": 14789,"Sequence number": 246624, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8284 } }, { "ph": "s", "id": 144, "pid": 1336759, "tid": 1336759, "ts": 1295650518397.912, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650518477.996, "dur": 2.855, "args": { "External id": 14790,"Sequence number": 246625, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8285 } }, { "ph": "s", "id": 143, "pid": 1336759, "tid": 1336759, "ts": 1295650518477.996, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650518490.127, "dur": 71.037, "args": { "External id": 14791,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650518492.747, "dur": 6.034, "args": { "External id": 14792,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8287 } }, { "ph": "s", "id": 142, "pid": 1336759, "tid": 1336759, "ts": 1295650518492.747, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650518494.501, "dur": 3.084, "args": { "External id": 14793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650518495.810, "dur": 1.357, "args": { "External id": 14794,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650518499.550, "dur": 61.356, "args": { "External id": 14795,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518501.007, "dur": 7.747, "args": { "External id": 14796,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518503.796, "dur": 4.793, "args": { "External id": 14797,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8292 } }, { "ph": "s", "id": 141, "pid": 1336759, "tid": 1336759, "ts": 1295650518503.796, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650518509.508, "dur": 44.860, "args": { "External id": 14798,"Sequence number": 246628, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8293 } }, { "ph": "s", "id": 140, "pid": 1336759, "tid": 1336759, "ts": 1295650518509.508, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650518555.987, "dur": 4.598, "args": { "External id": 14799,"Sequence number": 246629, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8294 } }, { "ph": "s", "id": 139, "pid": 1336759, "tid": 1336759, "ts": 1295650518555.987, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650518583.382, "dur": 152.713, "args": { "External id": 14800,"Sequence number": 246630, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8295 } }, { "ph": "s", "id": 138, "pid": 1336759, "tid": 1336759, "ts": 1295650518583.382, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650518628.058, "dur": 4.758, "args": { "External id": 14801,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650518667.239, "dur": 56.022, "args": { "External id": 14802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650518668.107, "dur": 4.220, "args": { "External id": 14803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650518669.049, "dur": 2.551, "args": { "External id": 14804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650518670.588, "dur": 0.862, "args": { "External id": 14805,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650518673.046, "dur": 49.884, "args": { "External id": 14806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518676.059, "dur": 2.639, "args": { "External id": 14807,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518677.000, "dur": 1.571, "args": { "External id": 14808,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650518679.191, "dur": 40.393, "args": { "External id": 14809,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650518721.245, "dur": 1.083, "args": { "External id": 14810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295650518745.356, "dur": 25.241, "args": { "External id": 14811,"Sequence number": 246631, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8306 } }, { "ph": "s", "id": 137, "pid": 1336759, "tid": 1336759, "ts": 1295650518745.356, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650518802.940, "dur": 220.107, "args": { "External id": 14812,"Sequence number": 246632, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8307 } }, { "ph": "s", "id": 136, "pid": 1336759, "tid": 1336759, "ts": 1295650518802.940, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518823.125, "dur": 5.193, "args": { "External id": 14813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518825.984, "dur": 2.214, "args": { "External id": 14814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650518835.369, "dur": 6.857, "args": { "External id": 14815,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650518837.754, "dur": 4.148, "args": { "External id": 14816,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650518847.718, "dur": 3.199, "args": { "External id": 14817,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650518964.039, "dur": 7.438, "args": { "External id": 14818,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650518964.990, "dur": 6.318, "args": { "External id": 14819,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650519043.800, "dur": 89.957, "args": { "External id": 14820,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650519044.853, "dur": 9.597, "args": { "External id": 14821,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8316 } }, { "ph": "s", "id": 135, "pid": 1336759, "tid": 1336759, "ts": 1295650519044.853, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650519048.761, "dur": 4.164, "args": { "External id": 14822,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519050.885, "dur": 1.805, "args": { "External id": 14823,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650519055.346, "dur": 78.119, "args": { "External id": 14824,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519056.834, "dur": 5.714, "args": { "External id": 14825,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519059.298, "dur": 3.123, "args": { "External id": 14826,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8321 } }, { "ph": "s", "id": 134, "pid": 1336759, "tid": 1336759, "ts": 1295650519059.298, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650519063.244, "dur": 65.186, "args": { "External id": 14827,"Sequence number": 246635, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8322 } }, { "ph": "s", "id": 133, "pid": 1336759, "tid": 1336759, "ts": 1295650519063.244, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650519130.143, "dur": 2.666, "args": { "External id": 14828,"Sequence number": 246636, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8323 } }, { "ph": "s", "id": 132, "pid": 1336759, "tid": 1336759, "ts": 1295650519130.143, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650519142.177, "dur": 64.052, "args": { "External id": 14829,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650519142.887, "dur": 9.664, "args": { "External id": 14830,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8325 } }, { "ph": "s", "id": 131, "pid": 1336759, "tid": 1336759, "ts": 1295650519142.887, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650519148.687, "dur": 2.649, "args": { "External id": 14831,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519150.186, "dur": 0.992, "args": { "External id": 14832,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650519153.327, "dur": 52.640, "args": { "External id": 14833,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519154.233, "dur": 4.726, "args": { "External id": 14834,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519155.726, "dur": 3.103, "args": { "External id": 14835,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8330 } }, { "ph": "s", "id": 130, "pid": 1336759, "tid": 1336759, "ts": 1295650519155.726, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650519159.553, "dur": 42.615, "args": { "External id": 14836,"Sequence number": 246639, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8331 } }, { "ph": "s", "id": 129, "pid": 1336759, "tid": 1336759, "ts": 1295650519159.553, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650519203.781, "dur": 1.830, "args": { "External id": 14837,"Sequence number": 246640, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8332 } }, { "ph": "s", "id": 128, "pid": 1336759, "tid": 1336759, "ts": 1295650519203.781, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650519213.242, "dur": 81.318, "args": { "External id": 14838,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650519213.914, "dur": 7.408, "args": { "External id": 14839,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8334 } }, { "ph": "s", "id": 127, "pid": 1336759, "tid": 1336759, "ts": 1295650519213.914, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650519215.548, "dur": 4.774, "args": { "External id": 14840,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519218.069, "dur": 2.044, "args": { "External id": 14841,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650519222.180, "dur": 72.158, "args": { "External id": 14842,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519223.288, "dur": 19.423, "args": { "External id": 14843,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519224.020, "dur": 18.021, "args": { "External id": 14844,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8339 } }, { "ph": "s", "id": 126, "pid": 1336759, "tid": 1336759, "ts": 1295650519224.020, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650519245.741, "dur": 42.098, "args": { "External id": 14845,"Sequence number": 246643, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8340 } }, { "ph": "s", "id": 125, "pid": 1336759, "tid": 1336759, "ts": 1295650519245.741, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650519289.567, "dur": 4.254, "args": { "External id": 14846,"Sequence number": 246644, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8341 } }, { "ph": "s", "id": 124, "pid": 1336759, "tid": 1336759, "ts": 1295650519289.567, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519312.244, "dur": 4.204, "args": { "External id": 14847,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519312.992, "dur": 3.309, "args": { "External id": 14848,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8343 } }, { "ph": "s", "id": 123, "pid": 1336759, "tid": 1336759, "ts": 1295650519312.992, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519349.219, "dur": 7.406, "args": { "External id": 14849,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519352.019, "dur": 4.486, "args": { "External id": 14850,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8345 } }, { "ph": "s", "id": 122, "pid": 1336759, "tid": 1336759, "ts": 1295650519352.019, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519360.785, "dur": 4.451, "args": { "External id": 14851,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519361.508, "dur": 3.584, "args": { "External id": 14852,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8347 } }, { "ph": "s", "id": 121, "pid": 1336759, "tid": 1336759, "ts": 1295650519361.508, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650519396.689, "dur": 157.696, "args": { "External id": 14853,"Sequence number": 246648, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8348 } }, { "ph": "s", "id": 120, "pid": 1336759, "tid": 1336759, "ts": 1295650519396.689, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650519415.923, "dur": 8.307, "args": { "External id": 14854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519418.490, "dur": 5.197, "args": { "External id": 14855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8350 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650519567.950, "dur": 99.418, "args": { "External id": 14856,"Sequence number": 246649, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8351 } }, { "ph": "s", "id": 119, "pid": 1336759, "tid": 1336759, "ts": 1295650519567.950, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650519581.881, "dur": 6.424, "args": { "External id": 14857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519583.549, "dur": 4.277, "args": { "External id": 14858,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8353 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336759, "tid": 1336759, "ts": 1295650519693.299, "dur": 167.381, "args": { "External id": 14859,"Sequence number": 246650, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8354 } }, { "ph": "s", "id": 118, "pid": 1336759, "tid": 1336759, "ts": 1295650519693.299, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650519721.004, "dur": 116.444, "args": { "External id": 14860,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650519766.100, "dur": 7.252, "args": { "External id": 14861,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519768.517, "dur": 4.397, "args": { "External id": 14862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650519776.171, "dur": 3.814, "args": { "External id": 14863,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650519781.140, "dur": 3.239, "args": { "External id": 14864,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650519786.910, "dur": 3.114, "args": { "External id": 14865,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1336759, "ts": 1295650519848.278, "dur": 4.318, "args": { "External id": 14866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519864.621, "dur": 7.110, "args": { "External id": 14867,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519866.033, "dur": 5.573, "args": { "External id": 14868,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8363 } }, { "ph": "s", "id": 117, "pid": 1336759, "tid": 1336759, "ts": 1295650519866.033, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650519886.410, "dur": 91.756, "args": { "External id": 14869,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650519887.405, "dur": 7.447, "args": { "External id": 14870,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8365 } }, { "ph": "s", "id": 116, "pid": 1336759, "tid": 1336759, "ts": 1295650519887.405, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650519890.115, "dur": 3.766, "args": { "External id": 14871,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650519892.195, "dur": 1.423, "args": { "External id": 14872,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650519895.669, "dur": 82.192, "args": { "External id": 14873,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650519898.944, "dur": 3.709, "args": { "External id": 14874,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650519899.572, "dur": 2.935, "args": { "External id": 14875,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8370 } }, { "ph": "s", "id": 115, "pid": 1336759, "tid": 1336759, "ts": 1295650519899.572, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650519903.572, "dur": 66.992, "args": { "External id": 14876,"Sequence number": 246654, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8371 } }, { "ph": "s", "id": 114, "pid": 1336759, "tid": 1336759, "ts": 1295650519903.572, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650519972.278, "dur": 4.929, "args": { "External id": 14877,"Sequence number": 246655, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8372 } }, { "ph": "s", "id": 113, "pid": 1336759, "tid": 1336759, "ts": 1295650519972.278, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650520052.680, "dur": 223.703, "args": { "External id": 14878,"Sequence number": 246656, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8373 } }, { "ph": "s", "id": 112, "pid": 1336759, "tid": 1336759, "ts": 1295650520052.680, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520075.007, "dur": 3.369, "args": { "External id": 14879,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520075.816, "dur": 2.295, "args": { "External id": 14880,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336759, "tid": 1336759, "ts": 1295650520082.334, "dur": 4.534, "args": { "External id": 14881,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520083.324, "dur": 3.433, "args": { "External id": 14882,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520085.539, "dur": 1.096, "args": { "External id": 14883,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650520094.196, "dur": 7.446, "args": { "External id": 14884,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520095.972, "dur": 5.306, "args": { "External id": 14885,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650520107.503, "dur": 3.397, "args": { "External id": 14886,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650520114.334, "dur": 3.398, "args": { "External id": 14887,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520251.170, "dur": 4.025, "args": { "External id": 14888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520252.304, "dur": 2.573, "args": { "External id": 14889,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520259.598, "dur": 2.124, "args": { "External id": 14890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520260.534, "dur": 1.067, "args": { "External id": 14891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650520294.521, "dur": 94.348, "args": { "External id": 14892,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650520295.514, "dur": 7.310, "args": { "External id": 14893,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8388 } }, { "ph": "s", "id": 111, "pid": 1336759, "tid": 1336759, "ts": 1295650520295.514, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650520298.004, "dur": 3.827, "args": { "External id": 14894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520300.250, "dur": 1.362, "args": { "External id": 14895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650520305.419, "dur": 83.172, "args": { "External id": 14896,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520306.780, "dur": 3.132, "args": { "External id": 14897,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520307.742, "dur": 2.039, "args": { "External id": 14898,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8393 } }, { "ph": "s", "id": 110, "pid": 1336759, "tid": 1336759, "ts": 1295650520307.742, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650520310.863, "dur": 71.573, "args": { "External id": 14899,"Sequence number": 246659, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8394 } }, { "ph": "s", "id": 109, "pid": 1336759, "tid": 1336759, "ts": 1295650520310.863, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650520384.198, "dur": 3.836, "args": { "External id": 14900,"Sequence number": 246660, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8395 } }, { "ph": "s", "id": 108, "pid": 1336759, "tid": 1336759, "ts": 1295650520384.198, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650520397.102, "dur": 65.098, "args": { "External id": 14901,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650520397.786, "dur": 5.543, "args": { "External id": 14902,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8397 } }, { "ph": "s", "id": 107, "pid": 1336759, "tid": 1336759, "ts": 1295650520397.786, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650520399.656, "dur": 2.700, "args": { "External id": 14903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520401.149, "dur": 1.057, "args": { "External id": 14904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650520404.088, "dur": 57.912, "args": { "External id": 14905,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520406.662, "dur": 5.952, "args": { "External id": 14906,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520407.485, "dur": 4.959, "args": { "External id": 14907,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8402 } }, { "ph": "s", "id": 106, "pid": 1336759, "tid": 1336759, "ts": 1295650520407.485, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650520413.312, "dur": 42.523, "args": { "External id": 14908,"Sequence number": 246663, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8403 } }, { "ph": "s", "id": 105, "pid": 1336759, "tid": 1336759, "ts": 1295650520413.312, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650520457.424, "dur": 4.198, "args": { "External id": 14909,"Sequence number": 246664, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8404 } }, { "ph": "s", "id": 104, "pid": 1336759, "tid": 1336759, "ts": 1295650520457.424, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650520483.112, "dur": 138.218, "args": { "External id": 14910,"Sequence number": 246665, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8405 } }, { "ph": "s", "id": 103, "pid": 1336759, "tid": 1336759, "ts": 1295650520483.112, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650520519.931, "dur": 4.220, "args": { "External id": 14911,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650520553.534, "dur": 55.924, "args": { "External id": 14912,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650520554.196, "dur": 4.948, "args": { "External id": 14913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650520555.519, "dur": 2.729, "args": { "External id": 14914,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520557.174, "dur": 0.913, "args": { "External id": 14915,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650520561.310, "dur": 47.873, "args": { "External id": 14916,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520562.387, "dur": 2.293, "args": { "External id": 14917,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520563.291, "dur": 1.275, "args": { "External id": 14918,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650520565.263, "dur": 40.568, "args": { "External id": 14919,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650520607.558, "dur": 1.055, "args": { "External id": 14920,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295650520629.483, "dur": 23.284, "args": { "External id": 14921,"Sequence number": 246666, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8416 } }, { "ph": "s", "id": 102, "pid": 1336759, "tid": 1336759, "ts": 1295650520629.483, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650520684.794, "dur": 176.932, "args": { "External id": 14922,"Sequence number": 246667, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8417 } }, { "ph": "s", "id": 101, "pid": 1336759, "tid": 1336759, "ts": 1295650520684.794, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520705.141, "dur": 2.919, "args": { "External id": 14923,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520706.046, "dur": 1.886, "args": { "External id": 14924,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650520715.105, "dur": 6.806, "args": { "External id": 14925,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520717.390, "dur": 4.143, "args": { "External id": 14926,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650520727.702, "dur": 3.698, "args": { "External id": 14927,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520845.789, "dur": 2.996, "args": { "External id": 14928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520846.704, "dur": 1.853, "args": { "External id": 14929,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650520879.035, "dur": 79.463, "args": { "External id": 14930,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650520879.996, "dur": 5.872, "args": { "External id": 14931,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8426 } }, { "ph": "s", "id": 100, "pid": 1336759, "tid": 1336759, "ts": 1295650520879.996, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650520881.773, "dur": 3.070, "args": { "External id": 14932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520883.441, "dur": 1.240, "args": { "External id": 14933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650520886.745, "dur": 71.528, "args": { "External id": 14934,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520889.467, "dur": 3.994, "args": { "External id": 14935,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520890.435, "dur": 2.880, "args": { "External id": 14936,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8431 } }, { "ph": "s", "id": 99, "pid": 1336759, "tid": 1336759, "ts": 1295650520890.435, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650520894.428, "dur": 56.643, "args": { "External id": 14937,"Sequence number": 246670, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8432 } }, { "ph": "s", "id": 98, "pid": 1336759, "tid": 1336759, "ts": 1295650520894.428, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650520952.822, "dur": 4.889, "args": { "External id": 14938,"Sequence number": 246671, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8433 } }, { "ph": "s", "id": 97, "pid": 1336759, "tid": 1336759, "ts": 1295650520952.822, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650520965.398, "dur": 106.657, "args": { "External id": 14939,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650520967.668, "dur": 5.016, "args": { "External id": 14940,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8435 } }, { "ph": "s", "id": 96, "pid": 1336759, "tid": 1336759, "ts": 1295650520967.668, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650520969.745, "dur": 2.113, "args": { "External id": 14941,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650520971.005, "dur": 0.721, "args": { "External id": 14942,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650520973.203, "dur": 98.614, "args": { "External id": 14943,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650520974.072, "dur": 4.302, "args": { "External id": 14944,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650520976.275, "dur": 1.952, "args": { "External id": 14945,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8440 } }, { "ph": "s", "id": 95, "pid": 1336759, "tid": 1336759, "ts": 1295650520976.275, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650520978.842, "dur": 87.196, "args": { "External id": 14946,"Sequence number": 246674, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8441 } }, { "ph": "s", "id": 94, "pid": 1336759, "tid": 1336759, "ts": 1295650520978.842, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650521068.634, "dur": 2.671, "args": { "External id": 14947,"Sequence number": 246675, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8442 } }, { "ph": "s", "id": 93, "pid": 1336759, "tid": 1336759, "ts": 1295650521068.634, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650521080.171, "dur": 60.459, "args": { "External id": 14948,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650521080.818, "dur": 7.954, "args": { "External id": 14949,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8444 } }, { "ph": "s", "id": 92, "pid": 1336759, "tid": 1336759, "ts": 1295650521080.818, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650521083.968, "dur": 3.742, "args": { "External id": 14950,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521085.387, "dur": 2.123, "args": { "External id": 14951,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650521089.460, "dur": 50.914, "args": { "External id": 14952,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521090.400, "dur": 5.973, "args": { "External id": 14953,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521092.855, "dur": 3.238, "args": { "External id": 14954,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8449 } }, { "ph": "s", "id": 91, "pid": 1336759, "tid": 1336759, "ts": 1295650521092.855, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650521097.111, "dur": 37.690, "args": { "External id": 14955,"Sequence number": 246678, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8450 } }, { "ph": "s", "id": 90, "pid": 1336759, "tid": 1336759, "ts": 1295650521097.111, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650521136.381, "dur": 3.600, "args": { "External id": 14956,"Sequence number": 246679, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8451 } }, { "ph": "s", "id": 89, "pid": 1336759, "tid": 1336759, "ts": 1295650521136.381, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521156.980, "dur": 4.637, "args": { "External id": 14957,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521157.660, "dur": 3.646, "args": { "External id": 14958,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8453 } }, { "ph": "s", "id": 88, "pid": 1336759, "tid": 1336759, "ts": 1295650521157.660, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521168.043, "dur": 2.993, "args": { "External id": 14959,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521168.883, "dur": 2.031, "args": { "External id": 14960,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8455 } }, { "ph": "s", "id": 87, "pid": 1336759, "tid": 1336759, "ts": 1295650521168.883, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521175.477, "dur": 2.864, "args": { "External id": 14961,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521176.327, "dur": 1.891, "args": { "External id": 14962,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8457 } }, { "ph": "s", "id": 86, "pid": 1336759, "tid": 1336759, "ts": 1295650521176.327, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650521208.022, "dur": 176.118, "args": { "External id": 14963,"Sequence number": 246683, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8458 } }, { "ph": "s", "id": 85, "pid": 1336759, "tid": 1336759, "ts": 1295650521208.022, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650521243.569, "dur": 10.685, "args": { "External id": 14964,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521246.120, "dur": 7.366, "args": { "External id": 14965,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8460 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650521397.253, "dur": 100.821, "args": { "External id": 14966,"Sequence number": 246684, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8461 } }, { "ph": "s", "id": 84, "pid": 1336759, "tid": 1336759, "ts": 1295650521397.253, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650521411.179, "dur": 6.425, "args": { "External id": 14967,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521413.024, "dur": 4.235, "args": { "External id": 14968,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8463 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336759, "tid": 1336759, "ts": 1295650521524.927, "dur": 165.852, "args": { "External id": 14969,"Sequence number": 246685, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8464 } }, { "ph": "s", "id": 83, "pid": 1336759, "tid": 1336759, "ts": 1295650521524.927, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650521550.203, "dur": 116.068, "args": { "External id": 14970,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650521595.663, "dur": 6.592, "args": { "External id": 14971,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521597.901, "dur": 3.920, "args": { "External id": 14972,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650521604.668, "dur": 3.941, "args": { "External id": 14973,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650521609.654, "dur": 1.560, "args": { "External id": 14974,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650521614.087, "dur": 3.095, "args": { "External id": 14975,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1336759, "ts": 1295650521677.270, "dur": 5.015, "args": { "External id": 14976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521695.295, "dur": 5.950, "args": { "External id": 14977,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521697.309, "dur": 3.817, "args": { "External id": 14978,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8473 } }, { "ph": "s", "id": 82, "pid": 1336759, "tid": 1336759, "ts": 1295650521697.309, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650521712.751, "dur": 96.481, "args": { "External id": 14979,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650521713.895, "dur": 10.944, "args": { "External id": 14980,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8475 } }, { "ph": "s", "id": 81, "pid": 1336759, "tid": 1336759, "ts": 1295650521713.895, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650521718.488, "dur": 5.353, "args": { "External id": 14981,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521722.290, "dur": 1.318, "args": { "External id": 14982,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650521725.819, "dur": 83.090, "args": { "External id": 14983,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521727.407, "dur": 2.794, "args": { "External id": 14984,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521728.114, "dur": 1.978, "args": { "External id": 14985,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8480 } }, { "ph": "s", "id": 80, "pid": 1336759, "tid": 1336759, "ts": 1295650521728.114, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650521731.094, "dur": 70.261, "args": { "External id": 14986,"Sequence number": 246689, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8481 } }, { "ph": "s", "id": 79, "pid": 1336759, "tid": 1336759, "ts": 1295650521731.094, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650521803.567, "dur": 4.649, "args": { "External id": 14987,"Sequence number": 246690, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8482 } }, { "ph": "s", "id": 78, "pid": 1336759, "tid": 1336759, "ts": 1295650521803.567, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650521840.083, "dur": 239.359, "args": { "External id": 14988,"Sequence number": 246691, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8483 } }, { "ph": "s", "id": 77, "pid": 1336759, "tid": 1336759, "ts": 1295650521840.083, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521856.627, "dur": 2.377, "args": { "External id": 14989,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521857.480, "dur": 1.400, "args": { "External id": 14990,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336759, "tid": 1336759, "ts": 1295650521862.806, "dur": 4.474, "args": { "External id": 14991,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650521865.373, "dur": 1.796, "args": { "External id": 14992,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650521865.955, "dur": 1.099, "args": { "External id": 14993,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650521873.852, "dur": 6.771, "args": { "External id": 14994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650521875.591, "dur": 4.749, "args": { "External id": 14995,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650521886.308, "dur": 2.838, "args": { "External id": 14996,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650521892.554, "dur": 3.248, "args": { "External id": 14997,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522055.692, "dur": 4.267, "args": { "External id": 14998,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522056.963, "dur": 2.708, "args": { "External id": 14999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522062.648, "dur": 2.234, "args": { "External id": 15000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522063.619, "dur": 1.156, "args": { "External id": 15001,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522096.983, "dur": 103.164, "args": { "External id": 15002,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522105.330, "dur": 8.774, "args": { "External id": 15003,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8498 } }, { "ph": "s", "id": 76, "pid": 1336759, "tid": 1336759, "ts": 1295650522105.330, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522109.029, "dur": 4.078, "args": { "External id": 15004,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522111.239, "dur": 1.600, "args": { "External id": 15005,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522114.980, "dur": 84.927, "args": { "External id": 15006,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522116.447, "dur": 6.438, "args": { "External id": 15007,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522117.316, "dur": 5.426, "args": { "External id": 15008,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8503 } }, { "ph": "s", "id": 75, "pid": 1336759, "tid": 1336759, "ts": 1295650522117.316, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522123.790, "dur": 67.329, "args": { "External id": 15009,"Sequence number": 246694, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8504 } }, { "ph": "s", "id": 74, "pid": 1336759, "tid": 1336759, "ts": 1295650522123.790, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522192.887, "dur": 6.513, "args": { "External id": 15010,"Sequence number": 246695, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8505 } }, { "ph": "s", "id": 73, "pid": 1336759, "tid": 1336759, "ts": 1295650522192.887, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522207.768, "dur": 85.228, "args": { "External id": 15011,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522208.527, "dur": 6.862, "args": { "External id": 15012,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8507 } }, { "ph": "s", "id": 72, "pid": 1336759, "tid": 1336759, "ts": 1295650522208.527, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522210.587, "dur": 3.733, "args": { "External id": 15013,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522213.207, "dur": 0.932, "args": { "External id": 15014,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522215.871, "dur": 76.916, "args": { "External id": 15015,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522216.847, "dur": 3.944, "args": { "External id": 15016,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522217.448, "dur": 3.197, "args": { "External id": 15017,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8512 } }, { "ph": "s", "id": 71, "pid": 1336759, "tid": 1336759, "ts": 1295650522217.448, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522222.624, "dur": 64.798, "args": { "External id": 15018,"Sequence number": 246698, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8513 } }, { "ph": "s", "id": 70, "pid": 1336759, "tid": 1336759, "ts": 1295650522222.624, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522289.733, "dur": 2.600, "args": { "External id": 15019,"Sequence number": 246699, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8514 } }, { "ph": "s", "id": 69, "pid": 1336759, "tid": 1336759, "ts": 1295650522289.733, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650522314.205, "dur": 139.610, "args": { "External id": 15020,"Sequence number": 246700, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8515 } }, { "ph": "s", "id": 68, "pid": 1336759, "tid": 1336759, "ts": 1295650522314.205, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650522350.519, "dur": 4.529, "args": { "External id": 15021,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522385.764, "dur": 55.207, "args": { "External id": 15022,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522386.534, "dur": 5.173, "args": { "External id": 15023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522387.614, "dur": 3.131, "args": { "External id": 15024,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522389.645, "dur": 0.943, "args": { "External id": 15025,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522392.354, "dur": 48.297, "args": { "External id": 15026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522393.490, "dur": 2.280, "args": { "External id": 15027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522394.333, "dur": 1.301, "args": { "External id": 15028,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522397.936, "dur": 39.591, "args": { "External id": 15029,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522439.177, "dur": 0.896, "args": { "External id": 15030,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295650522461.862, "dur": 23.936, "args": { "External id": 15031,"Sequence number": 246701, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8526 } }, { "ph": "s", "id": 67, "pid": 1336759, "tid": 1336759, "ts": 1295650522461.862, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650522516.862, "dur": 172.724, "args": { "External id": 15032,"Sequence number": 246702, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8527 } }, { "ph": "s", "id": 66, "pid": 1336759, "tid": 1336759, "ts": 1295650522516.862, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522533.750, "dur": 3.466, "args": { "External id": 15033,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522535.090, "dur": 2.009, "args": { "External id": 15034,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650522546.963, "dur": 8.401, "args": { "External id": 15035,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522550.519, "dur": 4.431, "args": { "External id": 15036,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650522564.902, "dur": 5.018, "args": { "External id": 15037,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522678.089, "dur": 2.397, "args": { "External id": 15038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522678.948, "dur": 1.364, "args": { "External id": 15039,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522706.695, "dur": 94.678, "args": { "External id": 15040,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522707.399, "dur": 6.899, "args": { "External id": 15041,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8536 } }, { "ph": "s", "id": 65, "pid": 1336759, "tid": 1336759, "ts": 1295650522707.399, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522708.933, "dur": 4.227, "args": { "External id": 15042,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522711.800, "dur": 1.154, "args": { "External id": 15043,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522715.066, "dur": 86.076, "args": { "External id": 15044,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522716.167, "dur": 3.258, "args": { "External id": 15045,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522717.002, "dur": 2.292, "args": { "External id": 15046,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8541 } }, { "ph": "s", "id": 64, "pid": 1336759, "tid": 1336759, "ts": 1295650522717.002, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522721.752, "dur": 74.439, "args": { "External id": 15047,"Sequence number": 246705, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8542 } }, { "ph": "s", "id": 63, "pid": 1336759, "tid": 1336759, "ts": 1295650522721.752, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522798.002, "dur": 2.523, "args": { "External id": 15048,"Sequence number": 246706, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8543 } }, { "ph": "s", "id": 62, "pid": 1336759, "tid": 1336759, "ts": 1295650522798.002, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522808.978, "dur": 79.059, "args": { "External id": 15049,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522809.586, "dur": 7.867, "args": { "External id": 15050,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8545 } }, { "ph": "s", "id": 61, "pid": 1336759, "tid": 1336759, "ts": 1295650522809.586, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522811.053, "dur": 5.344, "args": { "External id": 15051,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522813.939, "dur": 2.220, "args": { "External id": 15052,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522817.985, "dur": 69.856, "args": { "External id": 15053,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522818.811, "dur": 3.110, "args": { "External id": 15054,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522819.713, "dur": 2.069, "args": { "External id": 15055,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8550 } }, { "ph": "s", "id": 60, "pid": 1336759, "tid": 1336759, "ts": 1295650522819.713, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522822.506, "dur": 57.293, "args": { "External id": 15056,"Sequence number": 246709, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8551 } }, { "ph": "s", "id": 59, "pid": 1336759, "tid": 1336759, "ts": 1295650522822.506, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522881.277, "dur": 6.087, "args": { "External id": 15057,"Sequence number": 246710, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8552 } }, { "ph": "s", "id": 58, "pid": 1336759, "tid": 1336759, "ts": 1295650522881.277, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650522894.689, "dur": 71.535, "args": { "External id": 15058,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650522895.135, "dur": 5.126, "args": { "External id": 15059,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8554 } }, { "ph": "s", "id": 57, "pid": 1336759, "tid": 1336759, "ts": 1295650522895.135, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650522896.707, "dur": 2.468, "args": { "External id": 15060,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650522898.275, "dur": 0.758, "args": { "External id": 15061,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650522902.306, "dur": 63.741, "args": { "External id": 15062,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522903.246, "dur": 4.135, "args": { "External id": 15063,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522903.860, "dur": 3.395, "args": { "External id": 15064,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8559 } }, { "ph": "s", "id": 56, "pid": 1336759, "tid": 1336759, "ts": 1295650522903.860, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650522907.852, "dur": 53.030, "args": { "External id": 15065,"Sequence number": 246713, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8560 } }, { "ph": "s", "id": 55, "pid": 1336759, "tid": 1336759, "ts": 1295650522907.852, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650522962.581, "dur": 3.080, "args": { "External id": 15066,"Sequence number": 246714, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8561 } }, { "ph": "s", "id": 54, "pid": 1336759, "tid": 1336759, "ts": 1295650522962.581, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650522980.021, "dur": 3.576, "args": { "External id": 15067,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650522980.917, "dur": 2.481, "args": { "External id": 15068,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8563 } }, { "ph": "s", "id": 53, "pid": 1336759, "tid": 1336759, "ts": 1295650522980.917, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523032.096, "dur": 4.224, "args": { "External id": 15069,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523032.912, "dur": 3.181, "args": { "External id": 15070,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8565 } }, { "ph": "s", "id": 52, "pid": 1336759, "tid": 1336759, "ts": 1295650523032.912, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523041.976, "dur": 4.725, "args": { "External id": 15071,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523043.003, "dur": 3.538, "args": { "External id": 15072,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8567 } }, { "ph": "s", "id": 51, "pid": 1336759, "tid": 1336759, "ts": 1295650523043.003, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650523075.965, "dur": 175.273, "args": { "External id": 15073,"Sequence number": 246718, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8568 } }, { "ph": "s", "id": 50, "pid": 1336759, "tid": 1336759, "ts": 1295650523075.965, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650523094.679, "dur": 8.518, "args": { "External id": 15074,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523096.977, "dur": 5.766, "args": { "External id": 15075,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8570 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650523265.134, "dur": 110.891, "args": { "External id": 15076,"Sequence number": 246719, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8571 } }, { "ph": "s", "id": 49, "pid": 1336759, "tid": 1336759, "ts": 1295650523265.134, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650523280.409, "dur": 8.240, "args": { "External id": 15077,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523282.632, "dur": 5.641, "args": { "External id": 15078,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8573 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336759, "tid": 1336759, "ts": 1295650523402.713, "dur": 172.381, "args": { "External id": 15079,"Sequence number": 246720, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8574 } }, { "ph": "s", "id": 48, "pid": 1336759, "tid": 1336759, "ts": 1295650523402.713, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650523430.898, "dur": 119.003, "args": { "External id": 15080,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650523479.510, "dur": 6.681, "args": { "External id": 15081,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523481.742, "dur": 4.082, "args": { "External id": 15082,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650523488.795, "dur": 3.966, "args": { "External id": 15083,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650523493.806, "dur": 2.799, "args": { "External id": 15084,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650523499.279, "dur": 3.290, "args": { "External id": 15085,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336759, "tid": 1336759, "ts": 1295650523560.620, "dur": 4.753, "args": { "External id": 15086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523579.374, "dur": 5.695, "args": { "External id": 15087,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523581.048, "dur": 3.835, "args": { "External id": 15088,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8583 } }, { "ph": "s", "id": 47, "pid": 1336759, "tid": 1336759, "ts": 1295650523581.048, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650523596.286, "dur": 96.621, "args": { "External id": 15089,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650523598.969, "dur": 7.720, "args": { "External id": 15090,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8585 } }, { "ph": "s", "id": 46, "pid": 1336759, "tid": 1336759, "ts": 1295650523598.969, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650523601.195, "dur": 4.536, "args": { "External id": 15091,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523603.708, "dur": 1.756, "args": { "External id": 15092,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650523608.034, "dur": 84.558, "args": { "External id": 15093,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523609.609, "dur": 3.932, "args": { "External id": 15094,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523611.545, "dur": 1.867, "args": { "External id": 15095,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8590 } }, { "ph": "s", "id": 45, "pid": 1336759, "tid": 1336759, "ts": 1295650523611.545, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650523614.539, "dur": 72.177, "args": { "External id": 15096,"Sequence number": 246724, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8591 } }, { "ph": "s", "id": 44, "pid": 1336759, "tid": 1336759, "ts": 1295650523614.539, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650523688.776, "dur": 3.217, "args": { "External id": 15097,"Sequence number": 246725, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8592 } }, { "ph": "s", "id": 43, "pid": 1336759, "tid": 1336759, "ts": 1295650523688.776, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650523722.477, "dur": 189.923, "args": { "External id": 15098,"Sequence number": 246726, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8593 } }, { "ph": "s", "id": 42, "pid": 1336759, "tid": 1336759, "ts": 1295650523722.477, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523740.803, "dur": 3.316, "args": { "External id": 15099,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523741.756, "dur": 2.216, "args": { "External id": 15100,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336759, "tid": 1336759, "ts": 1295650523747.892, "dur": 2.812, "args": { "External id": 15101,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523748.998, "dur": 1.594, "args": { "External id": 15102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523749.563, "dur": 0.892, "args": { "External id": 15103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650523757.676, "dur": 6.837, "args": { "External id": 15104,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523760.159, "dur": 4.073, "args": { "External id": 15105,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650523770.058, "dur": 3.192, "args": { "External id": 15106,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650523776.518, "dur": 3.941, "args": { "External id": 15107,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523892.658, "dur": 3.482, "args": { "External id": 15108,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523893.895, "dur": 1.991, "args": { "External id": 15109,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523898.381, "dur": 2.226, "args": { "External id": 15110,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523899.611, "dur": 0.896, "args": { "External id": 15111,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650523928.516, "dur": 127.158, "args": { "External id": 15112,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650523929.292, "dur": 7.302, "args": { "External id": 15113,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8608 } }, { "ph": "s", "id": 41, "pid": 1336759, "tid": 1336759, "ts": 1295650523929.292, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650523930.696, "dur": 4.838, "args": { "External id": 15114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650523932.218, "dur": 3.023, "args": { "External id": 15115,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650523937.656, "dur": 117.718, "args": { "External id": 15116,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650523939.282, "dur": 5.033, "args": { "External id": 15117,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650523941.762, "dur": 2.212, "args": { "External id": 15118,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8613 } }, { "ph": "s", "id": 40, "pid": 1336759, "tid": 1336759, "ts": 1295650523941.762, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650523945.007, "dur": 101.088, "args": { "External id": 15119,"Sequence number": 246729, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8614 } }, { "ph": "s", "id": 39, "pid": 1336759, "tid": 1336759, "ts": 1295650523945.007, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650524049.890, "dur": 4.747, "args": { "External id": 15120,"Sequence number": 246730, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8615 } }, { "ph": "s", "id": 38, "pid": 1336759, "tid": 1336759, "ts": 1295650524049.890, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650524065.022, "dur": 73.696, "args": { "External id": 15121,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650524065.642, "dur": 8.958, "args": { "External id": 15122,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8617 } }, { "ph": "s", "id": 37, "pid": 1336759, "tid": 1336759, "ts": 1295650524065.642, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650524070.448, "dur": 2.996, "args": { "External id": 15123,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524072.102, "dur": 1.156, "args": { "External id": 15124,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650524075.210, "dur": 63.309, "args": { "External id": 15125,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650524075.953, "dur": 5.948, "args": { "External id": 15126,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650524078.321, "dur": 3.460, "args": { "External id": 15127,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8622 } }, { "ph": "s", "id": 36, "pid": 1336759, "tid": 1336759, "ts": 1295650524078.321, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650524082.557, "dur": 49.948, "args": { "External id": 15128,"Sequence number": 246733, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8623 } }, { "ph": "s", "id": 35, "pid": 1336759, "tid": 1336759, "ts": 1295650524082.557, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650524134.251, "dur": 3.933, "args": { "External id": 15129,"Sequence number": 246734, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8624 } }, { "ph": "s", "id": 34, "pid": 1336759, "tid": 1336759, "ts": 1295650524134.251, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650524157.450, "dur": 166.632, "args": { "External id": 15130,"Sequence number": 246735, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8625 } }, { "ph": "s", "id": 33, "pid": 1336759, "tid": 1336759, "ts": 1295650524157.450, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650524194.315, "dur": 4.835, "args": { "External id": 15131,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650524245.758, "dur": 65.222, "args": { "External id": 15132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650524246.539, "dur": 7.832, "args": { "External id": 15133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650524248.018, "dur": 5.049, "args": { "External id": 15134,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524249.934, "dur": 2.711, "args": { "External id": 15135,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650524255.019, "dur": 55.676, "args": { "External id": 15136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336759, "tid": 1336759, "ts": 1295650524256.611, "dur": 3.800, "args": { "External id": 15137,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650524258.821, "dur": 1.493, "args": { "External id": 15138,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650524261.156, "dur": 45.610, "args": { "External id": 15139,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336759, "tid": 1336759, "ts": 1295650524308.690, "dur": 1.309, "args": { "External id": 15140,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295650524332.926, "dur": 25.447, "args": { "External id": 15141,"Sequence number": 246736, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8636 } }, { "ph": "s", "id": 32, "pid": 1336759, "tid": 1336759, "ts": 1295650524332.926, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336759, "tid": 1336759, "ts": 1295650524376.602, "dur": 37.931, "args": { "External id": 15142,"Sequence number": 246737, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "-2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8637 } }, { "ph": "s", "id": 31, "pid": 1336759, "tid": 1336759, "ts": 1295650524376.602, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336759, "tid": 1336759, "ts": 1295650524385.899, "dur": 24.873, "args": { "External id": 15143,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650524411.982, "dur": 1.329, "args": { "External id": 15144,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 8192], []], "Ev Idx": 8639 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336759, "tid": 1336759, "ts": 1295650524448.972, "dur": 37.665, "args": { "External id": 15145,"Record function id": 0, "Ev Idx": 8640 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 2/0", "pid": 1336759, "tid": 1336759, "ts": 1295650524487.703, "dur": 178.497, "args": { "External id": 15146,"Record function id": 0, "Ev Idx": 8641 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650524522.469, "dur": 135.650, "args": { "External id": 15147,"Sequence number": 246738, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1], [33554432, 8192, 2048, 1]], "Input Dims": [[2048], [16, 4096, 4, 2048]], "Ev Idx": 8642 } }, { "ph": "s", "id": 30, "pid": 1336759, "tid": 1336759, "ts": 1295650524522.469, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336759, "tid": 1336759, "ts": 1295650524587.945, "dur": 34.327, "args": { "External id": 15148,"kernel_hash": "cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/xq/cxq73k7hzeap6epyl22bkojjyhqsfjuzklwbe2qcgpfenip5hwvj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [262144, 2048], [2048], [262144], [], [], [], [], [], [], [], [], []], "Ev Idx": 8643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650524745.281, "dur": 34.314, "args": { "External id": 15149,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650524747.740, "dur": 4.631, "args": { "External id": 15150,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650524755.540, "dur": 23.739, "args": { "External id": 15151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650524758.752, "dur": 20.024, "args": { "External id": 15152,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650524783.642, "dur": 16.465, "args": { "External id": 15153,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650524784.510, "dur": 2.758, "args": { "External id": 15154,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650524789.360, "dur": 10.481, "args": { "External id": 15155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650524790.045, "dur": 9.376, "args": { "External id": 15156,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650524803.068, "dur": 13.863, "args": { "External id": 15157,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650524803.785, "dur": 2.470, "args": { "External id": 15158,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650524806.703, "dur": 9.963, "args": { "External id": 15159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650524807.057, "dur": 9.270, "args": { "External id": 15160,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650524827.114, "dur": 0.838, "args": { "External id": 15161,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 8656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336759, "tid": 1336759, "ts": 1295650524834.936, "dur": 10.600, "args": { "External id": 15162,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "5", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524841.912, "dur": 2.218, "args": { "External id": 15163,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524851.737, "dur": 6.372, "args": { "External id": 15164,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524855.565, "dur": 0.967, "args": { "External id": 15165,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524859.251, "dur": 2.996, "args": { "External id": 15166,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524860.917, "dur": 0.663, "args": { "External id": 15167,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524863.513, "dur": 2.885, "args": { "External id": 15168,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524865.255, "dur": 0.623, "args": { "External id": 15169,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524869.340, "dur": 2.960, "args": { "External id": 15170,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524870.869, "dur": 0.820, "args": { "External id": 15171,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524873.337, "dur": 3.000, "args": { "External id": 15172,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524874.883, "dur": 0.795, "args": { "External id": 15173,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524877.269, "dur": 2.914, "args": { "External id": 15174,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4096, 4], [], [], [], []], "Ev Idx": 8669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524879.194, "dur": 0.482, "args": { "External id": 15175,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650524883.824, "dur": 5.208, "args": { "External id": 15176,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4096, 4], [], []], "Ev Idx": 8671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524887.508, "dur": 0.785, "args": { "External id": 15177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524892.965, "dur": 2.917, "args": { "External id": 15178,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 8673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524894.708, "dur": 0.589, "args": { "External id": 15179,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650524901.261, "dur": 8.331, "args": { "External id": 15180,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 8675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524907.414, "dur": 0.842, "args": { "External id": 15181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524910.545, "dur": 2.852, "args": { "External id": 15182,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 8677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524912.103, "dur": 0.759, "args": { "External id": 15183,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 8678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524915.798, "dur": 6.935, "args": { "External id": 15184,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8679 } }, { "ph": "s", "id": 29, "pid": 1336759, "tid": 1336759, "ts": 1295650524915.798, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524920.405, "dur": 0.850, "args": { "External id": 15185,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524923.699, "dur": 4.617, "args": { "External id": 15186,"Sequence number": 246740, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8681 } }, { "ph": "s", "id": 28, "pid": 1336759, "tid": 1336759, "ts": 1295650524923.699, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524926.929, "dur": 0.592, "args": { "External id": 15187,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650524929.225, "dur": 5.694, "args": { "External id": 15188,"Sequence number": 246741, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 8683 } }, { "ph": "s", "id": 27, "pid": 1336759, "tid": 1336759, "ts": 1295650524929.225, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524933.518, "dur": 0.551, "args": { "External id": 15189,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650524935.849, "dur": 5.651, "args": { "External id": 15190,"Sequence number": 246742, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 8685 } }, { "ph": "s", "id": 26, "pid": 1336759, "tid": 1336759, "ts": 1295650524935.849, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650524938.317, "dur": 2.315, "args": { "External id": 15191,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 8686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650524947.641, "dur": 79.415, "args": { "External id": 15192,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650524950.024, "dur": 76.797, "args": { "External id": 15193,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650524952.616, "dur": 5.152, "args": { "External id": 15194,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 8689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650524954.332, "dur": 2.845, "args": { "External id": 15195,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650524959.434, "dur": 66.339, "args": { "External id": 15196,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 8691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650525054.142, "dur": 5.198, "args": { "External id": 15197,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8692 } }, { "ph": "s", "id": 25, "pid": 1336759, "tid": 1336759, "ts": 1295650525054.142, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650525061.559, "dur": 1.118, "args": { "External id": 15198,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8693 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650525090.504, "dur": 72267.467, "args": { "External id": 15199,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 8694 } }, { "ph": "s", "id": 24, "pid": 1336759, "tid": 1336759, "ts": 1295650525090.504, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650525105.353, "dur": 33.843, "args": { "External id": 15200,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650525106.008, "dur": 32.960, "args": { "External id": 15201,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650525107.341, "dur": 7.954, "args": { "External id": 15202,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650525108.883, "dur": 5.997, "args": { "External id": 15203,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650525116.156, "dur": 22.449, "args": { "External id": 15204,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 8699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650525157.144, "dur": 24.949, "args": { "External id": 15205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650525159.007, "dur": 6.231, "args": { "External id": 15206,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650525160.849, "dur": 4.020, "args": { "External id": 15207,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650525166.166, "dur": 15.711, "args": { "External id": 15208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 8703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650525167.268, "dur": 14.253, "args": { "External id": 15209,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650525185.458, "dur": 26.184, "args": { "External id": 15210,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650525186.094, "dur": 5.922, "args": { "External id": 15211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650525188.885, "dur": 2.928, "args": { "External id": 15212,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650525201.101, "dur": 10.347, "args": { "External id": 15213,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650525201.811, "dur": 9.293, "args": { "External id": 15214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 8709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650525215.770, "dur": 32.712, "args": { "External id": 15215,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650525216.997, "dur": 4.702, "args": { "External id": 15216,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650525222.262, "dur": 25.945, "args": { "External id": 15217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 8712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650525222.798, "dur": 24.519, "args": { "External id": 15218,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1336759, "ts": 1295650525259.222, "dur": 29.973, "args": { "External id": 15219,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650525294.390, "dur": 58.521, "args": { "External id": 15220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650525298.750, "dur": 53.767, "args": { "External id": 15221,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650525305.779, "dur": 1.127, "args": { "External id": 15222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650525308.372, "dur": 25.037, "args": { "External id": 15223,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650525310.394, "dur": 22.781, "args": { "External id": 15224,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 8719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650525314.712, "dur": 3.034, "args": { "External id": 15225,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650525318.606, "dur": 14.176, "args": { "External id": 15226,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 8721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295650525358.194, "dur": 66231.634, "args": { "External id": 15227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295650525360.472, "dur": 66226.932, "args": { "External id": 15228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650591611.169, "dur": 13.770, "args": { "External id": 15229,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650591620.064, "dur": 2.063, "args": { "External id": 15230,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650591631.329, "dur": 126.382, "args": { "External id": 15231,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650591635.146, "dur": 10.783, "args": { "External id": 15232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650591637.954, "dur": 7.087, "args": { "External id": 15233,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650591643.939, "dur": 0.797, "args": { "External id": 15234,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650591647.640, "dur": 109.018, "args": { "External id": 15235,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650591649.962, "dur": 105.428, "args": { "External id": 15236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650591762.030, "dur": 5.125, "args": { "External id": 15237,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650591764.565, "dur": 0.956, "args": { "External id": 15238,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650591779.568, "dur": 4.425, "args": { "External id": 15239,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650591796.659, "dur": 8.379, "args": { "External id": 15240,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650591799.114, "dur": 5.640, "args": { "External id": 15241,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650591951.886, "dur": 291.661, "args": { "External id": 15242,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650591957.319, "dur": 2.825, "args": { "External id": 15243,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650591963.105, "dur": 279.761, "args": { "External id": 15244,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650591968.782, "dur": 0.793, "args": { "External id": 15245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650591973.111, "dur": 64.030, "args": { "External id": 15246,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650592040.595, "dur": 6.349, "args": { "External id": 15247,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592045.120, "dur": 1.409, "args": { "External id": 15248,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650592048.797, "dur": 25.892, "args": { "External id": 15249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650592050.337, "dur": 1.738, "args": { "External id": 15250,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650592054.478, "dur": 19.884, "args": { "External id": 15251,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650592058.857, "dur": 3.506, "args": { "External id": 15252,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650592077.507, "dur": 25.253, "args": { "External id": 15253,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650592105.761, "dur": 20.939, "args": { "External id": 15254,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650592132.264, "dur": 18.300, "args": { "External id": 15255,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650592153.598, "dur": 16.048, "args": { "External id": 15256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650592172.153, "dur": 22.444, "args": { "External id": 15257,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650592175.079, "dur": 1.452, "args": { "External id": 15258,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592179.078, "dur": 0.833, "args": { "External id": 15259,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650592197.175, "dur": 15.576, "args": { "External id": 15260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650592216.309, "dur": 24.484, "args": { "External id": 15261,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650592253.295, "dur": 3.104, "args": { "External id": 15262,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650592265.016, "dur": 5.017, "args": { "External id": 15263,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592267.990, "dur": 1.064, "args": { "External id": 15264,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650592361.678, "dur": 79.518, "args": { "External id": 15265,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650592447.191, "dur": 5.710, "args": { "External id": 15266,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592450.351, "dur": 1.038, "args": { "External id": 15267,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650592455.110, "dur": 30.784, "args": { "External id": 15268,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650592494.053, "dur": 6.623, "args": { "External id": 15269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650592495.930, "dur": 4.034, "args": { "External id": 15270,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592498.235, "dur": 1.489, "args": { "External id": 15271,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650592505.066, "dur": 45.092, "args": { "External id": 15272,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650592506.363, "dur": 43.340, "args": { "External id": 15273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650592555.844, "dur": 18.216, "args": { "External id": 15274,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650592579.725, "dur": 5.196, "args": { "External id": 15275,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592583.009, "dur": 1.144, "args": { "External id": 15276,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650592589.421, "dur": 51.354, "args": { "External id": 15277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650592590.581, "dur": 3.785, "args": { "External id": 15278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650592591.440, "dur": 2.341, "args": { "External id": 15279,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592592.719, "dur": 0.910, "args": { "External id": 15280,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650592595.202, "dur": 45.202, "args": { "External id": 15281,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650592597.356, "dur": 42.529, "args": { "External id": 15282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650592645.155, "dur": 4.041, "args": { "External id": 15283,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592647.050, "dur": 0.864, "args": { "External id": 15284,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650592655.566, "dur": 1.693, "args": { "External id": 15285,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650592665.400, "dur": 9.724, "args": { "External id": 15286,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650592669.311, "dur": 5.500, "args": { "External id": 15287,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650592769.346, "dur": 179.445, "args": { "External id": 15288,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650592771.559, "dur": 2.228, "args": { "External id": 15289,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650592775.775, "dur": 172.429, "args": { "External id": 15290,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650592777.679, "dur": 0.450, "args": { "External id": 15291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650592779.575, "dur": 23.207, "args": { "External id": 15292,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650592804.331, "dur": 3.053, "args": { "External id": 15293,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592806.236, "dur": 0.923, "args": { "External id": 15294,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650592808.417, "dur": 24.727, "args": { "External id": 15295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650592810.737, "dur": 1.441, "args": { "External id": 15296,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650592813.883, "dur": 19.000, "args": { "External id": 15297,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650592818.559, "dur": 3.133, "args": { "External id": 15298,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650592835.313, "dur": 20.314, "args": { "External id": 15299,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650592857.177, "dur": 12.815, "args": { "External id": 15300,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650592873.012, "dur": 12.754, "args": { "External id": 15301,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650592887.321, "dur": 12.436, "args": { "External id": 15302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650592901.443, "dur": 20.830, "args": { "External id": 15303,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650592903.761, "dur": 1.753, "args": { "External id": 15304,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592908.797, "dur": 0.884, "args": { "External id": 15305,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650592923.658, "dur": 11.507, "args": { "External id": 15306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650592936.241, "dur": 10.567, "args": { "External id": 15307,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650592955.646, "dur": 2.002, "args": { "External id": 15308,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650592966.389, "dur": 2.974, "args": { "External id": 15309,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650592968.255, "dur": 0.432, "args": { "External id": 15310,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650593079.092, "dur": 57.711, "args": { "External id": 15311,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650593142.345, "dur": 7.897, "args": { "External id": 15312,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593147.035, "dur": 1.814, "args": { "External id": 15313,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650593151.766, "dur": 25.257, "args": { "External id": 15314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650593181.832, "dur": 5.379, "args": { "External id": 15315,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650593183.457, "dur": 3.092, "args": { "External id": 15316,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593185.289, "dur": 1.028, "args": { "External id": 15317,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650593189.897, "dur": 55.557, "args": { "External id": 15318,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650593192.475, "dur": 51.935, "args": { "External id": 15319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650593251.445, "dur": 16.666, "args": { "External id": 15320,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650593274.656, "dur": 4.609, "args": { "External id": 15321,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593277.241, "dur": 1.066, "args": { "External id": 15322,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650593283.060, "dur": 55.882, "args": { "External id": 15323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650593283.969, "dur": 7.354, "args": { "External id": 15324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650593284.789, "dur": 5.941, "args": { "External id": 15325,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593288.197, "dur": 2.306, "args": { "External id": 15326,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650593292.081, "dur": 46.325, "args": { "External id": 15327,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650593292.690, "dur": 45.273, "args": { "External id": 15328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650593343.210, "dur": 4.104, "args": { "External id": 15329,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593345.329, "dur": 0.706, "args": { "External id": 15330,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650593353.666, "dur": 1.753, "args": { "External id": 15331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650593363.108, "dur": 7.673, "args": { "External id": 15332,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650593366.539, "dur": 3.951, "args": { "External id": 15333,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650593460.036, "dur": 281.208, "args": { "External id": 15334,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650593462.582, "dur": 2.501, "args": { "External id": 15335,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650593466.545, "dur": 274.243, "args": { "External id": 15336,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650593467.889, "dur": 0.390, "args": { "External id": 15337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650593471.129, "dur": 20.803, "args": { "External id": 15338,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650593493.454, "dur": 3.471, "args": { "External id": 15339,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593495.467, "dur": 1.121, "args": { "External id": 15340,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650593497.692, "dur": 23.520, "args": { "External id": 15341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650593500.034, "dur": 3.274, "args": { "External id": 15342,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650593504.495, "dur": 16.445, "args": { "External id": 15343,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650593507.068, "dur": 2.576, "args": { "External id": 15344,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650593522.610, "dur": 20.654, "args": { "External id": 15345,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650593544.610, "dur": 13.832, "args": { "External id": 15346,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650593560.707, "dur": 15.220, "args": { "External id": 15347,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650593577.558, "dur": 32.165, "args": { "External id": 15348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650593611.316, "dur": 42.712, "args": { "External id": 15349,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650593613.296, "dur": 1.806, "args": { "External id": 15350,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593618.236, "dur": 0.622, "args": { "External id": 15351,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650593655.686, "dur": 43.449, "args": { "External id": 15352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650593700.106, "dur": 39.644, "args": { "External id": 15353,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650593747.770, "dur": 1.967, "args": { "External id": 15354,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650593758.050, "dur": 3.183, "args": { "External id": 15355,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593759.937, "dur": 0.540, "args": { "External id": 15356,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650593825.863, "dur": 51.616, "args": { "External id": 15357,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650593883.781, "dur": 5.235, "args": { "External id": 15358,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593886.746, "dur": 1.041, "args": { "External id": 15359,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650593890.496, "dur": 22.845, "args": { "External id": 15360,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650593951.314, "dur": 6.673, "args": { "External id": 15361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650593952.984, "dur": 4.306, "args": { "External id": 15362,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650593954.799, "dur": 2.251, "args": { "External id": 15363,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650593961.932, "dur": 84.519, "args": { "External id": 15364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650593962.752, "dur": 82.311, "args": { "External id": 15365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650594052.630, "dur": 16.900, "args": { "External id": 15366,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594076.681, "dur": 4.682, "args": { "External id": 15367,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594079.463, "dur": 0.827, "args": { "External id": 15368,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650594085.388, "dur": 51.134, "args": { "External id": 15369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650594086.299, "dur": 4.905, "args": { "External id": 15370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650594088.541, "dur": 2.147, "args": { "External id": 15371,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594089.837, "dur": 0.694, "args": { "External id": 15372,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650594091.875, "dur": 44.239, "args": { "External id": 15373,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650594092.624, "dur": 42.824, "args": { "External id": 15374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594140.786, "dur": 3.913, "args": { "External id": 15375,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594142.864, "dur": 0.690, "args": { "External id": 15376,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650594153.234, "dur": 1.661, "args": { "External id": 15377,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594163.115, "dur": 6.458, "args": { "External id": 15378,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594164.945, "dur": 4.311, "args": { "External id": 15379,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650594286.753, "dur": 182.410, "args": { "External id": 15380,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594289.444, "dur": 3.463, "args": { "External id": 15381,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650594296.633, "dur": 172.076, "args": { "External id": 15382,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650594299.499, "dur": 0.435, "args": { "External id": 15383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650594300.932, "dur": 23.246, "args": { "External id": 15384,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650594325.866, "dur": 4.847, "args": { "External id": 15385,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594327.916, "dur": 2.450, "args": { "External id": 15386,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650594331.635, "dur": 20.838, "args": { "External id": 15387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594332.737, "dur": 1.727, "args": { "External id": 15388,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650594335.669, "dur": 16.534, "args": { "External id": 15389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650594338.527, "dur": 2.603, "args": { "External id": 15390,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650594354.195, "dur": 21.156, "args": { "External id": 15391,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650594376.639, "dur": 13.517, "args": { "External id": 15392,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650594394.793, "dur": 12.910, "args": { "External id": 15393,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650594409.080, "dur": 12.572, "args": { "External id": 15394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650594423.570, "dur": 19.041, "args": { "External id": 15395,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650594425.702, "dur": 1.657, "args": { "External id": 15396,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594429.392, "dur": 0.708, "args": { "External id": 15397,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650594443.939, "dur": 11.164, "args": { "External id": 15398,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650594458.252, "dur": 9.371, "args": { "External id": 15399,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650594476.089, "dur": 2.294, "args": { "External id": 15400,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594487.741, "dur": 3.694, "args": { "External id": 15401,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594490.145, "dur": 0.456, "args": { "External id": 15402,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650594561.762, "dur": 54.274, "args": { "External id": 15403,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594620.714, "dur": 6.103, "args": { "External id": 15404,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594623.233, "dur": 2.400, "args": { "External id": 15405,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650594628.480, "dur": 24.325, "args": { "External id": 15406,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650594657.253, "dur": 6.353, "args": { "External id": 15407,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650594660.369, "dur": 2.666, "args": { "External id": 15408,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594662.127, "dur": 0.692, "args": { "External id": 15409,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650594665.932, "dur": 38.648, "args": { "External id": 15410,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650594667.070, "dur": 36.934, "args": { "External id": 15411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650594708.449, "dur": 13.173, "args": { "External id": 15412,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594727.229, "dur": 4.446, "args": { "External id": 15413,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594730.242, "dur": 0.711, "args": { "External id": 15414,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650594735.221, "dur": 45.511, "args": { "External id": 15415,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650594735.968, "dur": 3.430, "args": { "External id": 15416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650594736.719, "dur": 2.125, "args": { "External id": 15417,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594738.086, "dur": 0.633, "args": { "External id": 15418,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650594739.873, "dur": 40.466, "args": { "External id": 15419,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650594740.357, "dur": 39.248, "args": { "External id": 15420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650594784.736, "dur": 3.237, "args": { "External id": 15421,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594786.345, "dur": 0.570, "args": { "External id": 15422,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650594794.752, "dur": 1.437, "args": { "External id": 15423,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594802.898, "dur": 6.256, "args": { "External id": 15424,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594804.607, "dur": 4.256, "args": { "External id": 15425,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650594888.486, "dur": 206.628, "args": { "External id": 15426,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594890.680, "dur": 3.458, "args": { "External id": 15427,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650594896.735, "dur": 197.727, "args": { "External id": 15428,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650594897.782, "dur": 0.363, "args": { "External id": 15429,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650594899.275, "dur": 18.376, "args": { "External id": 15430,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650594919.191, "dur": 4.973, "args": { "External id": 15431,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650594923.122, "dur": 0.749, "args": { "External id": 15432,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650594924.846, "dur": 18.644, "args": { "External id": 15433,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650594925.521, "dur": 1.677, "args": { "External id": 15434,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650594928.155, "dur": 15.095, "args": { "External id": 15435,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650594930.359, "dur": 2.391, "args": { "External id": 15436,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650594944.954, "dur": 18.401, "args": { "External id": 15437,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650594964.415, "dur": 11.223, "args": { "External id": 15438,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650594979.419, "dur": 49.842, "args": { "External id": 15439,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650595031.455, "dur": 12.443, "args": { "External id": 15440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650595045.968, "dur": 21.897, "args": { "External id": 15441,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650595049.599, "dur": 1.919, "args": { "External id": 15442,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595053.592, "dur": 0.985, "args": { "External id": 15443,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650595069.496, "dur": 11.151, "args": { "External id": 15444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650595082.949, "dur": 10.653, "args": { "External id": 15445,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650595102.492, "dur": 2.288, "args": { "External id": 15446,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595114.564, "dur": 3.667, "args": { "External id": 15447,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595117.012, "dur": 0.474, "args": { "External id": 15448,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650595185.609, "dur": 72.654, "args": { "External id": 15449,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595264.851, "dur": 5.708, "args": { "External id": 15450,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595267.926, "dur": 1.035, "args": { "External id": 15451,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650595271.951, "dur": 25.544, "args": { "External id": 15452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650595303.928, "dur": 5.868, "args": { "External id": 15453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650595305.288, "dur": 3.780, "args": { "External id": 15454,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595307.431, "dur": 1.438, "args": { "External id": 15455,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650595312.773, "dur": 43.747, "args": { "External id": 15456,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650595314.088, "dur": 41.608, "args": { "External id": 15457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650595360.508, "dur": 13.888, "args": { "External id": 15458,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595379.774, "dur": 4.837, "args": { "External id": 15459,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595383.211, "dur": 0.689, "args": { "External id": 15460,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650595388.415, "dur": 48.023, "args": { "External id": 15461,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650595389.207, "dur": 3.293, "args": { "External id": 15462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650595389.752, "dur": 2.213, "args": { "External id": 15463,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595391.006, "dur": 0.776, "args": { "External id": 15464,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650595393.151, "dur": 42.953, "args": { "External id": 15465,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650595395.251, "dur": 40.371, "args": { "External id": 15466,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595440.167, "dur": 3.708, "args": { "External id": 15467,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595442.087, "dur": 0.647, "args": { "External id": 15468,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650595458.935, "dur": 1.768, "args": { "External id": 15469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650595468.184, "dur": 9.662, "args": { "External id": 15470,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650595471.693, "dur": 5.841, "args": { "External id": 15471,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650595560.802, "dur": 178.663, "args": { "External id": 15472,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650595563.154, "dur": 2.136, "args": { "External id": 15473,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650595566.478, "dur": 172.355, "args": { "External id": 15474,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650595575.123, "dur": 0.354, "args": { "External id": 15475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650595578.414, "dur": 20.526, "args": { "External id": 15476,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650595600.762, "dur": 5.361, "args": { "External id": 15477,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595603.106, "dur": 2.751, "args": { "External id": 15478,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650595608.765, "dur": 20.253, "args": { "External id": 15479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650595609.422, "dur": 1.842, "args": { "External id": 15480,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650595612.517, "dur": 16.241, "args": { "External id": 15481,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650595615.112, "dur": 2.738, "args": { "External id": 15482,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650595630.452, "dur": 19.904, "args": { "External id": 15483,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650595651.364, "dur": 12.605, "args": { "External id": 15484,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650595666.285, "dur": 12.625, "args": { "External id": 15485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650595680.005, "dur": 11.171, "args": { "External id": 15486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650595692.890, "dur": 21.041, "args": { "External id": 15487,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650595696.235, "dur": 1.635, "args": { "External id": 15488,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595699.753, "dur": 2.246, "args": { "External id": 15489,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650595715.196, "dur": 11.318, "args": { "External id": 15490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650595727.412, "dur": 10.397, "args": { "External id": 15491,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650595745.735, "dur": 1.429, "args": { "External id": 15492,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595755.403, "dur": 3.271, "args": { "External id": 15493,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595757.547, "dur": 0.439, "args": { "External id": 15494,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650595820.181, "dur": 47.305, "args": { "External id": 15495,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595873.779, "dur": 4.216, "args": { "External id": 15496,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595876.142, "dur": 0.703, "args": { "External id": 15497,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650595879.323, "dur": 21.609, "args": { "External id": 15498,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650595904.779, "dur": 4.509, "args": { "External id": 15499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650595905.840, "dur": 2.856, "args": { "External id": 15500,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595907.442, "dur": 1.046, "args": { "External id": 15501,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650595913.045, "dur": 38.038, "args": { "External id": 15502,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650595914.023, "dur": 36.482, "args": { "External id": 15503,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650595954.966, "dur": 12.896, "args": { "External id": 15504,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650595972.975, "dur": 3.145, "args": { "External id": 15505,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595974.787, "dur": 0.613, "args": { "External id": 15506,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650595979.616, "dur": 91.153, "args": { "External id": 15507,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650595980.134, "dur": 42.253, "args": { "External id": 15508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650595982.280, "dur": 39.112, "args": { "External id": 15509,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650595983.601, "dur": 37.195, "args": { "External id": 15510,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650596023.771, "dur": 46.428, "args": { "External id": 15511,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650596024.582, "dur": 45.039, "args": { "External id": 15512,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596075.933, "dur": 4.156, "args": { "External id": 15513,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596078.109, "dur": 0.817, "args": { "External id": 15514,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650596086.613, "dur": 1.540, "args": { "External id": 15515,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596096.827, "dur": 7.017, "args": { "External id": 15516,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596098.708, "dur": 4.802, "args": { "External id": 15517,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650596183.661, "dur": 189.898, "args": { "External id": 15518,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596187.890, "dur": 2.489, "args": { "External id": 15519,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650596191.716, "dur": 181.293, "args": { "External id": 15520,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650596193.192, "dur": 0.266, "args": { "External id": 15521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650596194.504, "dur": 20.308, "args": { "External id": 15522,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650596216.118, "dur": 5.017, "args": { "External id": 15523,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596220.033, "dur": 0.816, "args": { "External id": 15524,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650596222.398, "dur": 37.405, "args": { "External id": 15525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596223.335, "dur": 1.555, "args": { "External id": 15526,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650596225.854, "dur": 33.558, "args": { "External id": 15527,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650596243.122, "dur": 3.543, "args": { "External id": 15528,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650596261.120, "dur": 21.021, "args": { "External id": 15529,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650596283.214, "dur": 12.645, "args": { "External id": 15530,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650596298.188, "dur": 13.057, "args": { "External id": 15531,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650596312.516, "dur": 11.602, "args": { "External id": 15532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650596325.843, "dur": 22.070, "args": { "External id": 15533,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650596331.032, "dur": 1.581, "args": { "External id": 15534,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596334.751, "dur": 0.573, "args": { "External id": 15535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650596349.339, "dur": 10.865, "args": { "External id": 15536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650596360.987, "dur": 11.167, "args": { "External id": 15537,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650596380.117, "dur": 2.074, "args": { "External id": 15538,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596391.105, "dur": 3.951, "args": { "External id": 15539,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596393.663, "dur": 0.628, "args": { "External id": 15540,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650596460.042, "dur": 51.259, "args": { "External id": 15541,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596516.167, "dur": 4.265, "args": { "External id": 15542,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596518.638, "dur": 0.704, "args": { "External id": 15543,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650596521.760, "dur": 23.051, "args": { "External id": 15544,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650596548.912, "dur": 7.582, "args": { "External id": 15545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650596550.430, "dur": 5.438, "args": { "External id": 15546,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596554.165, "dur": 1.548, "args": { "External id": 15547,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650596558.960, "dur": 39.240, "args": { "External id": 15548,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650596560.134, "dur": 37.438, "args": { "External id": 15549,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650596601.537, "dur": 12.865, "args": { "External id": 15550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596619.646, "dur": 3.799, "args": { "External id": 15551,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596622.012, "dur": 0.690, "args": { "External id": 15552,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650596626.691, "dur": 46.676, "args": { "External id": 15553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650596628.851, "dur": 3.770, "args": { "External id": 15554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650596629.675, "dur": 2.406, "args": { "External id": 15555,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596631.151, "dur": 0.784, "args": { "External id": 15556,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650596633.224, "dur": 39.776, "args": { "External id": 15557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650596634.029, "dur": 38.429, "args": { "External id": 15558,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596676.765, "dur": 3.126, "args": { "External id": 15559,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596678.299, "dur": 0.553, "args": { "External id": 15560,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650596686.978, "dur": 1.349, "args": { "External id": 15561,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596695.304, "dur": 6.392, "args": { "External id": 15562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596697.201, "dur": 4.239, "args": { "External id": 15563,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650596775.218, "dur": 167.935, "args": { "External id": 15564,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596779.364, "dur": 2.710, "args": { "External id": 15565,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650596785.620, "dur": 156.974, "args": { "External id": 15566,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650596786.486, "dur": 0.374, "args": { "External id": 15567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650596787.927, "dur": 20.732, "args": { "External id": 15568,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650596809.974, "dur": 4.963, "args": { "External id": 15569,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596814.072, "dur": 0.649, "args": { "External id": 15570,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650596815.562, "dur": 19.041, "args": { "External id": 15571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650596816.499, "dur": 1.489, "args": { "External id": 15572,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650596818.968, "dur": 15.375, "args": { "External id": 15573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650596821.208, "dur": 2.324, "args": { "External id": 15574,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650596837.275, "dur": 17.561, "args": { "External id": 15575,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650596855.873, "dur": 13.868, "args": { "External id": 15576,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650596871.828, "dur": 12.443, "args": { "External id": 15577,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650596885.260, "dur": 11.216, "args": { "External id": 15578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650596897.839, "dur": 18.155, "args": { "External id": 15579,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650596899.850, "dur": 1.571, "args": { "External id": 15580,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596903.110, "dur": 0.689, "args": { "External id": 15581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650596918.794, "dur": 10.709, "args": { "External id": 15582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650596930.287, "dur": 11.260, "args": { "External id": 15583,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650596948.498, "dur": 1.751, "args": { "External id": 15584,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650596957.662, "dur": 2.812, "args": { "External id": 15585,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650596959.454, "dur": 0.332, "args": { "External id": 15586,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650597064.848, "dur": 54.531, "args": { "External id": 15587,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597124.446, "dur": 5.644, "args": { "External id": 15588,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597127.684, "dur": 0.797, "args": { "External id": 15589,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650597131.666, "dur": 21.281, "args": { "External id": 15590,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650597159.564, "dur": 5.480, "args": { "External id": 15591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650597161.189, "dur": 3.279, "args": { "External id": 15592,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597163.067, "dur": 1.201, "args": { "External id": 15593,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650597167.798, "dur": 39.744, "args": { "External id": 15594,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650597168.938, "dur": 38.015, "args": { "External id": 15595,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650597211.308, "dur": 14.875, "args": { "External id": 15596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650597247.198, "dur": 31.541, "args": { "External id": 15597,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650597251.978, "dur": 26.335, "args": { "External id": 15598,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597258.128, "dur": 2.485, "args": { "External id": 15599,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650597284.956, "dur": 27.254, "args": { "External id": 15600,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650597286.866, "dur": 24.970, "args": { "External id": 15601,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597291.397, "dur": 4.094, "args": { "External id": 15602,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650597296.706, "dur": 14.683, "args": { "External id": 15603,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650597326.745, "dur": 5.621, "args": { "External id": 15604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9099 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650597328.970, "dur": 3.088, "args": { "External id": 15605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650597333.497, "dur": 2.997, "args": { "External id": 15606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9101 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650597335.870, "dur": 0.512, "args": { "External id": 15607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650597375.151, "dur": 21.669, "args": { "External id": 15608,"Sequence number": 246745, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9103 } }, { "ph": "s", "id": 23, "pid": 1336759, "tid": 1336759, "ts": 1295650597375.151, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597403.390, "dur": 6.172, "args": { "External id": 15609,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597407.087, "dur": 1.030, "args": { "External id": 15610,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650597412.383, "dur": 6.353, "args": { "External id": 15611,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "1"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597416.539, "dur": 0.964, "args": { "External id": 15612,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597421.702, "dur": 3.074, "args": { "External id": 15613,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597423.363, "dur": 0.840, "args": { "External id": 15614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597429.126, "dur": 5.777, "args": { "External id": 15615,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9110 } }, { "ph": "s", "id": 22, "pid": 1336759, "tid": 1336759, "ts": 1295650597429.126, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597432.371, "dur": 1.102, "args": { "External id": 15616,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597436.016, "dur": 6.405, "args": { "External id": 15617,"Sequence number": 246747, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9112 } }, { "ph": "s", "id": 21, "pid": 1336759, "tid": 1336759, "ts": 1295650597436.016, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597440.972, "dur": 0.703, "args": { "External id": 15618,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650597443.443, "dur": 5.146, "args": { "External id": 15619,"Sequence number": 246748, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9114 } }, { "ph": "s", "id": 20, "pid": 1336759, "tid": 1336759, "ts": 1295650597443.443, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597447.035, "dur": 0.773, "args": { "External id": 15620,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650597449.779, "dur": 4.520, "args": { "External id": 15621,"Sequence number": 246749, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9116 } }, { "ph": "s", "id": 19, "pid": 1336759, "tid": 1336759, "ts": 1295650597449.779, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597452.501, "dur": 1.120, "args": { "External id": 15622,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650597458.323, "dur": 32.415, "args": { "External id": 15623,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650597460.344, "dur": 30.175, "args": { "External id": 15624,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597462.860, "dur": 8.967, "args": { "External id": 15625,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650597468.222, "dur": 3.043, "args": { "External id": 15626,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650597472.825, "dur": 17.234, "args": { "External id": 15627,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650597515.184, "dur": 3.677, "args": { "External id": 15628,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9123 } }, { "ph": "s", "id": 18, "pid": 1336759, "tid": 1336759, "ts": 1295650597515.184, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650597521.171, "dur": 1.402, "args": { "External id": 15629,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9124 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650597553.822, "dur": 42137.029, "args": { "External id": 15630,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9125 } }, { "ph": "s", "id": 17, "pid": 1336759, "tid": 1336759, "ts": 1295650597553.822, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650597567.878, "dur": 24.727, "args": { "External id": 15631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650597568.609, "dur": 23.754, "args": { "External id": 15632,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597569.724, "dur": 7.183, "args": { "External id": 15633,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650597573.268, "dur": 3.299, "args": { "External id": 15634,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650597577.601, "dur": 14.390, "args": { "External id": 15635,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597608.963, "dur": 26.852, "args": { "External id": 15636,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597610.154, "dur": 5.327, "args": { "External id": 15637,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597611.777, "dur": 3.411, "args": { "External id": 15638,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650597617.487, "dur": 18.102, "args": { "External id": 15639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650597619.827, "dur": 15.349, "args": { "External id": 15640,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597639.259, "dur": 19.792, "args": { "External id": 15641,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650597639.804, "dur": 4.506, "args": { "External id": 15642,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597641.041, "dur": 3.030, "args": { "External id": 15643,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650597644.953, "dur": 13.889, "args": { "External id": 15644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650597647.490, "dur": 10.801, "args": { "External id": 15645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650597664.262, "dur": 15.213, "args": { "External id": 15646,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650597666.049, "dur": 2.751, "args": { "External id": 15647,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650597669.570, "dur": 9.647, "args": { "External id": 15648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650597670.316, "dur": 8.606, "args": { "External id": 15649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1336759, "ts": 1295650597684.144, "dur": 22.669, "args": { "External id": 15650,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650597709.798, "dur": 61.546, "args": { "External id": 15651,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650597726.092, "dur": 44.889, "args": { "External id": 15652,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597730.527, "dur": 2.465, "args": { "External id": 15653,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650597734.525, "dur": 22.191, "args": { "External id": 15654,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650597737.849, "dur": 18.669, "args": { "External id": 15655,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650597740.031, "dur": 2.877, "args": { "External id": 15656,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650597743.923, "dur": 12.194, "args": { "External id": 15657,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295650597774.770, "dur": 36517.955, "args": { "External id": 15658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295650597776.359, "dur": 36513.601, "args": { "External id": 15659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650634308.986, "dur": 8.676, "args": { "External id": 15660,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634314.174, "dur": 1.395, "args": { "External id": 15661,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650634323.043, "dur": 102.149, "args": { "External id": 15662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650634326.271, "dur": 6.129, "args": { "External id": 15663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650634328.464, "dur": 3.197, "args": { "External id": 15664,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634330.464, "dur": 0.944, "args": { "External id": 15665,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650634333.746, "dur": 90.782, "args": { "External id": 15666,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650634335.429, "dur": 88.349, "args": { "External id": 15667,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650634428.834, "dur": 3.778, "args": { "External id": 15668,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634430.835, "dur": 0.600, "args": { "External id": 15669,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650634442.164, "dur": 2.497, "args": { "External id": 15670,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650634453.899, "dur": 7.266, "args": { "External id": 15671,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650634456.179, "dur": 4.678, "args": { "External id": 15672,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650634589.438, "dur": 195.311, "args": { "External id": 15673,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650634594.016, "dur": 2.488, "args": { "External id": 15674,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650634598.072, "dur": 185.907, "args": { "External id": 15675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650634601.151, "dur": 0.538, "args": { "External id": 15676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650634603.378, "dur": 25.840, "args": { "External id": 15677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650634630.989, "dur": 5.224, "args": { "External id": 15678,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634635.038, "dur": 0.878, "args": { "External id": 15679,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650634637.261, "dur": 22.786, "args": { "External id": 15680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650634638.301, "dur": 2.068, "args": { "External id": 15681,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650634641.778, "dur": 18.014, "args": { "External id": 15682,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650634645.626, "dur": 3.180, "args": { "External id": 15683,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650634662.085, "dur": 22.578, "args": { "External id": 15684,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650634686.596, "dur": 13.345, "args": { "External id": 15685,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650634704.553, "dur": 15.004, "args": { "External id": 15686,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650634721.178, "dur": 11.961, "args": { "External id": 15687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650634735.103, "dur": 21.263, "args": { "External id": 15688,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650634739.061, "dur": 1.649, "args": { "External id": 15689,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634743.014, "dur": 0.848, "args": { "External id": 15690,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650634757.806, "dur": 11.595, "args": { "External id": 15691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650634772.522, "dur": 10.439, "args": { "External id": 15692,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650634791.423, "dur": 1.877, "args": { "External id": 15693,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650634799.555, "dur": 3.876, "args": { "External id": 15694,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634802.019, "dur": 0.607, "args": { "External id": 15695,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650634870.484, "dur": 58.645, "args": { "External id": 15696,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650634934.048, "dur": 5.036, "args": { "External id": 15697,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634936.373, "dur": 0.696, "args": { "External id": 15698,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650634940.913, "dur": 29.713, "args": { "External id": 15699,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650634977.027, "dur": 41.301, "args": { "External id": 15700,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650634978.567, "dur": 38.719, "args": { "External id": 15701,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650634980.615, "dur": 35.936, "args": { "External id": 15702,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650635022.864, "dur": 49.835, "args": { "External id": 15703,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650635024.176, "dur": 47.815, "args": { "External id": 15704,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650635077.545, "dur": 16.057, "args": { "External id": 15705,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635100.252, "dur": 5.992, "args": { "External id": 15706,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635104.606, "dur": 0.752, "args": { "External id": 15707,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650635110.594, "dur": 53.905, "args": { "External id": 15708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650635111.494, "dur": 4.260, "args": { "External id": 15709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650635112.539, "dur": 2.722, "args": { "External id": 15710,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635114.074, "dur": 1.025, "args": { "External id": 15711,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650635116.420, "dur": 47.594, "args": { "External id": 15712,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650635123.207, "dur": 40.257, "args": { "External id": 15713,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635168.773, "dur": 3.490, "args": { "External id": 15714,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635170.702, "dur": 0.583, "args": { "External id": 15715,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650635178.769, "dur": 1.755, "args": { "External id": 15716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635188.363, "dur": 9.798, "args": { "External id": 15717,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635192.331, "dur": 5.487, "args": { "External id": 15718,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650635307.887, "dur": 180.310, "args": { "External id": 15719,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635310.444, "dur": 2.842, "args": { "External id": 15720,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650635315.129, "dur": 172.541, "args": { "External id": 15721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650635316.828, "dur": 0.380, "args": { "External id": 15722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650635318.278, "dur": 23.220, "args": { "External id": 15723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650635346.983, "dur": 3.308, "args": { "External id": 15724,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635349.273, "dur": 0.720, "args": { "External id": 15725,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650635352.793, "dur": 22.583, "args": { "External id": 15726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635353.806, "dur": 3.173, "args": { "External id": 15727,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650635358.205, "dur": 16.877, "args": { "External id": 15728,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650635360.864, "dur": 3.095, "args": { "External id": 15729,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650635377.039, "dur": 19.885, "args": { "External id": 15730,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650635398.336, "dur": 13.872, "args": { "External id": 15731,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650635415.278, "dur": 13.217, "args": { "External id": 15732,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650635429.835, "dur": 11.416, "args": { "External id": 15733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650635443.051, "dur": 19.880, "args": { "External id": 15734,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650635446.319, "dur": 1.700, "args": { "External id": 15735,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635450.036, "dur": 0.640, "args": { "External id": 15736,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650635464.451, "dur": 10.905, "args": { "External id": 15737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650635476.354, "dur": 10.275, "args": { "External id": 15738,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650635494.756, "dur": 2.187, "args": { "External id": 15739,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635505.862, "dur": 3.505, "args": { "External id": 15740,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635508.202, "dur": 0.456, "args": { "External id": 15741,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650635573.648, "dur": 50.946, "args": { "External id": 15742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635630.813, "dur": 4.387, "args": { "External id": 15743,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635633.135, "dur": 0.942, "args": { "External id": 15744,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650635636.633, "dur": 22.462, "args": { "External id": 15745,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650635663.124, "dur": 6.211, "args": { "External id": 15746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650635664.346, "dur": 4.362, "args": { "External id": 15747,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635666.241, "dur": 2.230, "args": { "External id": 15748,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650635672.997, "dur": 38.501, "args": { "External id": 15749,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650635674.206, "dur": 36.723, "args": { "External id": 15750,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650635715.525, "dur": 13.362, "args": { "External id": 15751,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635734.332, "dur": 3.420, "args": { "External id": 15752,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635736.247, "dur": 0.616, "args": { "External id": 15753,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650635741.492, "dur": 47.149, "args": { "External id": 15754,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650635742.384, "dur": 5.090, "args": { "External id": 15755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650635744.919, "dur": 2.093, "args": { "External id": 15756,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635746.161, "dur": 0.716, "args": { "External id": 15757,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650635748.200, "dur": 40.102, "args": { "External id": 15758,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650635748.869, "dur": 38.945, "args": { "External id": 15759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650635792.815, "dur": 3.191, "args": { "External id": 15760,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635794.493, "dur": 0.496, "args": { "External id": 15761,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650635801.296, "dur": 1.216, "args": { "External id": 15762,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635810.942, "dur": 5.434, "args": { "External id": 15763,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635812.665, "dur": 3.428, "args": { "External id": 15764,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650635896.551, "dur": 215.569, "args": { "External id": 15765,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635904.518, "dur": 1.903, "args": { "External id": 15766,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650635909.378, "dur": 202.138, "args": { "External id": 15767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650635910.304, "dur": 0.371, "args": { "External id": 15768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650635911.871, "dur": 18.279, "args": { "External id": 15769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650635931.715, "dur": 4.720, "args": { "External id": 15770,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650635933.846, "dur": 2.397, "args": { "External id": 15771,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650635938.634, "dur": 18.091, "args": { "External id": 15772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650635939.486, "dur": 1.421, "args": { "External id": 15773,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650635941.878, "dur": 14.525, "args": { "External id": 15774,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650635943.972, "dur": 2.300, "args": { "External id": 15775,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650635957.800, "dur": 19.472, "args": { "External id": 15776,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650635978.389, "dur": 52.989, "args": { "External id": 15777,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650636035.247, "dur": 14.727, "args": { "External id": 15778,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650636051.408, "dur": 11.364, "args": { "External id": 15779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650636064.616, "dur": 21.754, "args": { "External id": 15780,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650636069.514, "dur": 1.613, "args": { "External id": 15781,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636072.849, "dur": 0.811, "args": { "External id": 15782,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650636087.640, "dur": 11.459, "args": { "External id": 15783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650636100.158, "dur": 10.382, "args": { "External id": 15784,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650636119.691, "dur": 2.045, "args": { "External id": 15785,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636130.767, "dur": 3.590, "args": { "External id": 15786,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636132.968, "dur": 0.559, "args": { "External id": 15787,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650636199.743, "dur": 74.314, "args": { "External id": 15788,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636280.499, "dur": 7.115, "args": { "External id": 15789,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636283.314, "dur": 2.663, "args": { "External id": 15790,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650636289.002, "dur": 25.346, "args": { "External id": 15791,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650636319.570, "dur": 5.897, "args": { "External id": 15792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650636320.806, "dur": 4.125, "args": { "External id": 15793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636323.667, "dur": 1.096, "args": { "External id": 15794,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650636328.153, "dur": 72.674, "args": { "External id": 15795,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650636329.185, "dur": 70.939, "args": { "External id": 15796,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650636404.838, "dur": 35.617, "args": { "External id": 15797,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636446.403, "dur": 3.804, "args": { "External id": 15798,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636448.426, "dur": 0.876, "args": { "External id": 15799,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650636453.837, "dur": 59.318, "args": { "External id": 15800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650636456.322, "dur": 3.145, "args": { "External id": 15801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650636456.994, "dur": 2.073, "args": { "External id": 15802,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636458.264, "dur": 0.565, "args": { "External id": 15803,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650636460.377, "dur": 52.302, "args": { "External id": 15804,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650636460.869, "dur": 51.278, "args": { "External id": 15805,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636516.805, "dur": 3.614, "args": { "External id": 15806,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636518.747, "dur": 0.626, "args": { "External id": 15807,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650636527.650, "dur": 1.542, "args": { "External id": 15808,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650636537.132, "dur": 6.113, "args": { "External id": 15809,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650636538.824, "dur": 4.151, "args": { "External id": 15810,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650636630.360, "dur": 172.237, "args": { "External id": 15811,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650636632.557, "dur": 3.759, "args": { "External id": 15812,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650636639.516, "dur": 162.452, "args": { "External id": 15813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650636640.901, "dur": 0.558, "args": { "External id": 15814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650636642.401, "dur": 20.568, "args": { "External id": 15815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650636664.605, "dur": 4.941, "args": { "External id": 15816,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636668.407, "dur": 0.898, "args": { "External id": 15817,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650636670.523, "dur": 19.484, "args": { "External id": 15818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650636671.607, "dur": 1.530, "args": { "External id": 15819,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650636674.195, "dur": 15.542, "args": { "External id": 15820,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650636676.689, "dur": 2.628, "args": { "External id": 15821,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650636693.093, "dur": 19.774, "args": { "External id": 15822,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650636714.001, "dur": 12.634, "args": { "External id": 15823,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650636729.224, "dur": 12.135, "args": { "External id": 15824,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650636742.543, "dur": 11.449, "args": { "External id": 15825,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650636755.496, "dur": 19.930, "args": { "External id": 15826,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650636757.308, "dur": 1.788, "args": { "External id": 15827,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636760.926, "dur": 2.488, "args": { "External id": 15828,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650636778.219, "dur": 11.246, "args": { "External id": 15829,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650636790.505, "dur": 10.424, "args": { "External id": 15830,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650636808.563, "dur": 1.810, "args": { "External id": 15831,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636817.822, "dur": 3.212, "args": { "External id": 15832,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636819.802, "dur": 0.407, "args": { "External id": 15833,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650636881.836, "dur": 46.158, "args": { "External id": 15834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650636932.363, "dur": 4.420, "args": { "External id": 15835,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636934.856, "dur": 0.794, "args": { "External id": 15836,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650636938.131, "dur": 22.605, "args": { "External id": 15837,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650636966.567, "dur": 4.816, "args": { "External id": 15838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650636967.641, "dur": 3.011, "args": { "External id": 15839,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650636969.243, "dur": 1.221, "args": { "External id": 15840,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650636973.541, "dur": 83.099, "args": { "External id": 15841,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650636974.231, "dur": 81.325, "args": { "External id": 15842,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650637062.318, "dur": 14.750, "args": { "External id": 15843,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637083.260, "dur": 6.082, "args": { "External id": 15844,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637087.389, "dur": 0.962, "args": { "External id": 15845,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650637093.213, "dur": 48.867, "args": { "External id": 15846,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650637094.195, "dur": 3.338, "args": { "External id": 15847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650637095.058, "dur": 1.955, "args": { "External id": 15848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637096.251, "dur": 0.625, "args": { "External id": 15849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650637098.337, "dur": 43.369, "args": { "External id": 15850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650637100.962, "dur": 40.086, "args": { "External id": 15851,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637146.141, "dur": 3.991, "args": { "External id": 15852,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637148.107, "dur": 0.951, "args": { "External id": 15853,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650637156.983, "dur": 1.554, "args": { "External id": 15854,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637165.970, "dur": 6.564, "args": { "External id": 15855,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637167.715, "dur": 4.555, "args": { "External id": 15856,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650637275.342, "dur": 207.829, "args": { "External id": 15857,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637279.623, "dur": 2.982, "args": { "External id": 15858,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650637284.163, "dur": 198.210, "args": { "External id": 15859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650637285.434, "dur": 0.447, "args": { "External id": 15860,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650637286.639, "dur": 20.397, "args": { "External id": 15861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650637308.460, "dur": 4.655, "args": { "External id": 15862,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637312.025, "dur": 0.811, "args": { "External id": 15863,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650637313.855, "dur": 20.952, "args": { "External id": 15864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637315.325, "dur": 1.482, "args": { "External id": 15865,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650637317.877, "dur": 16.646, "args": { "External id": 15866,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650637320.481, "dur": 2.977, "args": { "External id": 15867,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650637337.820, "dur": 20.133, "args": { "External id": 15868,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650637359.040, "dur": 12.273, "args": { "External id": 15869,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650637373.825, "dur": 13.710, "args": { "External id": 15870,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650637388.891, "dur": 11.088, "args": { "External id": 15871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650637401.905, "dur": 53.762, "args": { "External id": 15872,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650637438.359, "dur": 1.900, "args": { "External id": 15873,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637442.739, "dur": 0.587, "args": { "External id": 15874,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650637459.000, "dur": 10.792, "args": { "External id": 15875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650637470.751, "dur": 10.635, "args": { "External id": 15876,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650637490.266, "dur": 2.019, "args": { "External id": 15877,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637501.734, "dur": 3.707, "args": { "External id": 15878,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637504.119, "dur": 0.514, "args": { "External id": 15879,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650637569.258, "dur": 52.795, "args": { "External id": 15880,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637626.532, "dur": 5.317, "args": { "External id": 15881,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637630.006, "dur": 0.820, "args": { "External id": 15882,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650637633.301, "dur": 24.057, "args": { "External id": 15883,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650637661.601, "dur": 4.819, "args": { "External id": 15884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650637662.701, "dur": 3.192, "args": { "External id": 15885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637664.504, "dur": 1.207, "args": { "External id": 15886,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650637668.738, "dur": 37.668, "args": { "External id": 15887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650637669.768, "dur": 35.990, "args": { "External id": 15888,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650637712.179, "dur": 13.394, "args": { "External id": 15889,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637730.522, "dur": 3.399, "args": { "External id": 15890,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637732.238, "dur": 0.805, "args": { "External id": 15891,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650637737.535, "dur": 46.644, "args": { "External id": 15892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650637738.287, "dur": 5.344, "args": { "External id": 15893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650637739.044, "dur": 4.130, "args": { "External id": 15894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637741.864, "dur": 1.160, "args": { "External id": 15895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650637744.173, "dur": 39.626, "args": { "External id": 15896,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650637744.555, "dur": 38.805, "args": { "External id": 15897,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650637787.721, "dur": 3.507, "args": { "External id": 15898,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637789.328, "dur": 0.892, "args": { "External id": 15899,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650637796.709, "dur": 1.363, "args": { "External id": 15900,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637806.887, "dur": 5.489, "args": { "External id": 15901,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637808.631, "dur": 3.426, "args": { "External id": 15902,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650637886.747, "dur": 213.962, "args": { "External id": 15903,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637890.588, "dur": 2.043, "args": { "External id": 15904,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650637893.804, "dur": 206.248, "args": { "External id": 15905,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650637894.906, "dur": 0.369, "args": { "External id": 15906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650637896.161, "dur": 18.837, "args": { "External id": 15907,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650637918.193, "dur": 4.634, "args": { "External id": 15908,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650637921.710, "dur": 0.923, "args": { "External id": 15909,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650637923.709, "dur": 18.670, "args": { "External id": 15910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650637924.415, "dur": 1.354, "args": { "External id": 15911,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650637926.887, "dur": 15.232, "args": { "External id": 15912,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650637929.103, "dur": 2.003, "args": { "External id": 15913,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650637943.536, "dur": 25.302, "args": { "External id": 15914,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650637969.946, "dur": 12.596, "args": { "External id": 15915,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650638021.532, "dur": 16.589, "args": { "External id": 15916,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650638039.521, "dur": 11.760, "args": { "External id": 15917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650638054.993, "dur": 19.502, "args": { "External id": 15918,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650638056.977, "dur": 1.737, "args": { "External id": 15919,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638060.828, "dur": 0.785, "args": { "External id": 15920,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650638076.146, "dur": 10.930, "args": { "External id": 15921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650638088.000, "dur": 10.882, "args": { "External id": 15922,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650638108.270, "dur": 2.133, "args": { "External id": 15923,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638119.469, "dur": 3.854, "args": { "External id": 15924,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638122.204, "dur": 0.437, "args": { "External id": 15925,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638190.393, "dur": 72.210, "args": { "External id": 15926,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638268.834, "dur": 4.950, "args": { "External id": 15927,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638271.535, "dur": 0.978, "args": { "External id": 15928,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650638275.194, "dur": 23.571, "args": { "External id": 15929,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650638303.771, "dur": 7.207, "args": { "External id": 15930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650638305.271, "dur": 5.013, "args": { "External id": 15931,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638308.742, "dur": 1.346, "args": { "External id": 15932,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650638313.630, "dur": 42.190, "args": { "External id": 15933,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638314.766, "dur": 40.553, "args": { "External id": 15934,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650638359.713, "dur": 14.201, "args": { "External id": 15935,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638379.722, "dur": 3.600, "args": { "External id": 15936,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638381.681, "dur": 0.895, "args": { "External id": 15937,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650638386.968, "dur": 45.544, "args": { "External id": 15938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650638389.620, "dur": 3.368, "args": { "External id": 15939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650638390.306, "dur": 2.175, "args": { "External id": 15940,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638391.623, "dur": 0.731, "args": { "External id": 15941,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650638393.527, "dur": 38.613, "args": { "External id": 15942,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638394.105, "dur": 37.544, "args": { "External id": 15943,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638436.472, "dur": 4.975, "args": { "External id": 15944,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638438.200, "dur": 2.101, "args": { "External id": 15945,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650638447.273, "dur": 1.448, "args": { "External id": 15946,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650638457.520, "dur": 6.313, "args": { "External id": 15947,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650638459.417, "dur": 4.129, "args": { "External id": 15948,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650638541.637, "dur": 172.681, "args": { "External id": 15949,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650638543.916, "dur": 2.051, "args": { "External id": 15950,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650638547.240, "dur": 166.650, "args": { "External id": 15951,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650638548.412, "dur": 0.441, "args": { "External id": 15952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650638551.818, "dur": 20.432, "args": { "External id": 15953,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650638574.072, "dur": 3.312, "args": { "External id": 15954,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638576.268, "dur": 0.840, "args": { "External id": 15955,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650638584.929, "dur": 21.197, "args": { "External id": 15956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650638585.763, "dur": 2.807, "args": { "External id": 15957,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650638589.956, "dur": 15.851, "args": { "External id": 15958,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650638592.421, "dur": 2.741, "args": { "External id": 15959,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650638607.475, "dur": 19.250, "args": { "External id": 15960,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650638627.888, "dur": 11.899, "args": { "External id": 15961,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650638641.924, "dur": 12.817, "args": { "External id": 15962,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650638657.374, "dur": 11.032, "args": { "External id": 15963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650638669.932, "dur": 17.783, "args": { "External id": 15964,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650638671.877, "dur": 1.655, "args": { "External id": 15965,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638675.111, "dur": 0.860, "args": { "External id": 15966,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650638688.919, "dur": 10.664, "args": { "External id": 15967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650638700.400, "dur": 10.529, "args": { "External id": 15968,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650638720.010, "dur": 1.475, "args": { "External id": 15969,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638728.655, "dur": 2.858, "args": { "External id": 15970,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638730.452, "dur": 0.396, "args": { "External id": 15971,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638786.747, "dur": 44.804, "args": { "External id": 15972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638835.700, "dur": 4.166, "args": { "External id": 15973,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638838.026, "dur": 0.781, "args": { "External id": 15974,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650638844.598, "dur": 21.262, "args": { "External id": 15975,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650638871.534, "dur": 5.675, "args": { "External id": 15976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650638872.358, "dur": 4.313, "args": { "External id": 15977,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638873.931, "dur": 2.536, "args": { "External id": 15978,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650638879.294, "dur": 38.101, "args": { "External id": 15979,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638880.331, "dur": 36.524, "args": { "External id": 15980,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650638920.764, "dur": 13.071, "args": { "External id": 15981,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650638938.753, "dur": 5.008, "args": { "External id": 15982,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638942.163, "dur": 0.791, "args": { "External id": 15983,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650638947.097, "dur": 82.496, "args": { "External id": 15984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650638947.777, "dur": 3.411, "args": { "External id": 15985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650638948.644, "dur": 1.958, "args": { "External id": 15986,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650638949.621, "dur": 0.843, "args": { "External id": 15987,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650638951.789, "dur": 77.308, "args": { "External id": 15988,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650638954.115, "dur": 73.773, "args": { "External id": 15989,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639035.942, "dur": 4.587, "args": { "External id": 15990,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639038.437, "dur": 0.894, "args": { "External id": 15991,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650639046.338, "dur": 1.558, "args": { "External id": 15992,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639055.119, "dur": 8.634, "args": { "External id": 15993,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639058.846, "dur": 4.642, "args": { "External id": 15994,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650639144.951, "dur": 190.731, "args": { "External id": 15995,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639146.876, "dur": 2.197, "args": { "External id": 15996,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650639152.228, "dur": 183.034, "args": { "External id": 15997,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650639153.353, "dur": 0.573, "args": { "External id": 15998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650639154.752, "dur": 21.513, "args": { "External id": 15999,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650639177.876, "dur": 5.308, "args": { "External id": 16000,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639179.919, "dur": 2.965, "args": { "External id": 16001,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650639184.009, "dur": 22.015, "args": { "External id": 16002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639186.933, "dur": 1.706, "args": { "External id": 16003,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650639189.533, "dur": 16.170, "args": { "External id": 16004,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650639192.116, "dur": 2.542, "args": { "External id": 16005,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650639207.240, "dur": 18.964, "args": { "External id": 16006,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650639241.948, "dur": 15.556, "args": { "External id": 16007,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650639261.397, "dur": 13.082, "args": { "External id": 16008,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650639275.658, "dur": 11.945, "args": { "External id": 16009,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650639289.675, "dur": 20.418, "args": { "External id": 16010,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650639291.729, "dur": 1.682, "args": { "External id": 16011,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639296.730, "dur": 0.699, "args": { "External id": 16012,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650639311.415, "dur": 11.097, "args": { "External id": 16013,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650639323.616, "dur": 10.478, "args": { "External id": 16014,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650639342.377, "dur": 2.068, "args": { "External id": 16015,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639353.172, "dur": 3.348, "args": { "External id": 16016,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639355.046, "dur": 0.561, "args": { "External id": 16017,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650639420.523, "dur": 58.223, "args": { "External id": 16018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639483.341, "dur": 7.250, "args": { "External id": 16019,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639487.182, "dur": 2.264, "args": { "External id": 16020,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650639492.076, "dur": 23.628, "args": { "External id": 16021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650639520.211, "dur": 4.873, "args": { "External id": 16022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650639521.533, "dur": 2.921, "args": { "External id": 16023,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639523.313, "dur": 0.889, "args": { "External id": 16024,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650639527.566, "dur": 44.230, "args": { "External id": 16025,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650639530.197, "dur": 40.955, "args": { "External id": 16026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650639575.650, "dur": 14.095, "args": { "External id": 16027,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650639594.828, "dur": 20.860, "args": { "External id": 16028,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650639596.859, "dur": 18.474, "args": { "External id": 16029,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639601.512, "dur": 0.867, "args": { "External id": 16030,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650639620.824, "dur": 24.649, "args": { "External id": 16031,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650639622.688, "dur": 22.560, "args": { "External id": 16032,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639626.728, "dur": 3.777, "args": { "External id": 16033,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650639631.803, "dur": 13.001, "args": { "External id": 16034,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650639657.035, "dur": 6.831, "args": { "External id": 16035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9530 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650639661.013, "dur": 2.541, "args": { "External id": 16036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650639664.933, "dur": 1.185, "args": { "External id": 16037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9532 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650639665.447, "dur": 0.585, "args": { "External id": 16038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650639704.796, "dur": 19.691, "args": { "External id": 16039,"Sequence number": 246752, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650639726.031, "dur": 12.736, "args": { "External id": 16040,"Sequence number": 246753, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9535 } }, { "ph": "s", "id": 16, "pid": 1336759, "tid": 1336759, "ts": 1295650639726.031, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639744.176, "dur": 5.548, "args": { "External id": 16041,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639747.527, "dur": 1.021, "args": { "External id": 16042,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650639753.793, "dur": 5.676, "args": { "External id": 16043,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639757.610, "dur": 0.843, "args": { "External id": 16044,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639760.777, "dur": 2.657, "args": { "External id": 16045,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639762.133, "dur": 0.725, "args": { "External id": 16046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639767.481, "dur": 7.444, "args": { "External id": 16047,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9542 } }, { "ph": "s", "id": 15, "pid": 1336759, "tid": 1336759, "ts": 1295650639767.481, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639772.409, "dur": 1.008, "args": { "External id": 16048,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639775.913, "dur": 4.645, "args": { "External id": 16049,"Sequence number": 246755, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9544 } }, { "ph": "s", "id": 14, "pid": 1336759, "tid": 1336759, "ts": 1295650639775.913, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639779.049, "dur": 0.658, "args": { "External id": 16050,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650639781.424, "dur": 6.940, "args": { "External id": 16051,"Sequence number": 246756, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9546 } }, { "ph": "s", "id": 13, "pid": 1336759, "tid": 1336759, "ts": 1295650639781.424, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639786.755, "dur": 0.718, "args": { "External id": 16052,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650639789.382, "dur": 3.793, "args": { "External id": 16053,"Sequence number": 246757, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9548 } }, { "ph": "s", "id": 12, "pid": 1336759, "tid": 1336759, "ts": 1295650639789.382, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639791.737, "dur": 0.709, "args": { "External id": 16054,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650639796.562, "dur": 28.698, "args": { "External id": 16055,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650639798.358, "dur": 26.702, "args": { "External id": 16056,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639800.757, "dur": 5.493, "args": { "External id": 16057,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639802.800, "dur": 2.826, "args": { "External id": 16058,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650639806.995, "dur": 17.636, "args": { "External id": 16059,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650639848.198, "dur": 3.586, "args": { "External id": 16060,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9555 } }, { "ph": "s", "id": 11, "pid": 1336759, "tid": 1336759, "ts": 1295650639848.198, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650639853.991, "dur": 2.704, "args": { "External id": 16061,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9556 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650639889.613, "dur": 44487.530, "args": { "External id": 16062,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9557 } }, { "ph": "s", "id": 10, "pid": 1336759, "tid": 1336759, "ts": 1295650639889.613, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650639906.555, "dur": 24.086, "args": { "External id": 16063,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650639907.458, "dur": 22.923, "args": { "External id": 16064,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639908.435, "dur": 4.826, "args": { "External id": 16065,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650639909.764, "dur": 3.125, "args": { "External id": 16066,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650639914.081, "dur": 15.859, "args": { "External id": 16067,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639945.661, "dur": 24.280, "args": { "External id": 16068,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639946.918, "dur": 5.638, "args": { "External id": 16069,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639948.607, "dur": 3.677, "args": { "External id": 16070,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650639954.046, "dur": 15.680, "args": { "External id": 16071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650639955.654, "dur": 13.673, "args": { "External id": 16072,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639973.411, "dur": 60.703, "args": { "External id": 16073,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650639974.007, "dur": 6.013, "args": { "External id": 16074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650639976.834, "dur": 2.980, "args": { "External id": 16075,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650639980.659, "dur": 53.270, "args": { "External id": 16076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650639981.411, "dur": 51.745, "args": { "External id": 16077,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650640041.871, "dur": 19.362, "args": { "External id": 16078,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650640043.611, "dur": 4.849, "args": { "External id": 16079,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650640049.245, "dur": 11.731, "args": { "External id": 16080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650640049.972, "dur": 10.673, "args": { "External id": 16081,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1336759, "ts": 1295650640067.740, "dur": 21.190, "args": { "External id": 16082,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650640091.335, "dur": 46.889, "args": { "External id": 16083,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650640093.266, "dur": 44.525, "args": { "External id": 16084,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650640098.054, "dur": 1.244, "args": { "External id": 16085,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650640100.533, "dur": 22.989, "args": { "External id": 16086,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650640102.202, "dur": 21.098, "args": { "External id": 16087,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650640105.960, "dur": 2.946, "args": { "External id": 16088,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650640109.764, "dur": 13.257, "args": { "External id": 16089,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295650640141.574, "dur": 38977.936, "args": { "External id": 16090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295650640143.375, "dur": 38975.302, "args": { "External id": 16091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679129.585, "dur": 8.173, "args": { "External id": 16092,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679135.065, "dur": 1.086, "args": { "External id": 16093,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650679142.450, "dur": 108.208, "args": { "External id": 16094,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650679143.776, "dur": 5.598, "args": { "External id": 16095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650679145.757, "dur": 2.905, "args": { "External id": 16096,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679147.564, "dur": 0.824, "args": { "External id": 16097,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650679150.631, "dur": 99.373, "args": { "External id": 16098,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650679154.194, "dur": 94.395, "args": { "External id": 16099,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679255.356, "dur": 4.577, "args": { "External id": 16100,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679257.775, "dur": 0.866, "args": { "External id": 16101,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650679266.924, "dur": 2.494, "args": { "External id": 16102,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679277.864, "dur": 6.000, "args": { "External id": 16103,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679279.741, "dur": 3.857, "args": { "External id": 16104,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650679400.143, "dur": 181.102, "args": { "External id": 16105,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679403.029, "dur": 2.094, "args": { "External id": 16106,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650679406.431, "dur": 174.393, "args": { "External id": 16107,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650679410.265, "dur": 0.554, "args": { "External id": 16108,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650679412.271, "dur": 22.823, "args": { "External id": 16109,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650679436.511, "dur": 3.333, "args": { "External id": 16110,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679438.687, "dur": 0.867, "args": { "External id": 16111,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650679440.765, "dur": 25.321, "args": { "External id": 16112,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679444.032, "dur": 1.213, "args": { "External id": 16113,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650679448.186, "dur": 17.568, "args": { "External id": 16114,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650679451.622, "dur": 2.899, "args": { "External id": 16115,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650679467.831, "dur": 20.954, "args": { "External id": 16116,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650679490.286, "dur": 13.856, "args": { "External id": 16117,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650679506.883, "dur": 13.975, "args": { "External id": 16118,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650679522.098, "dur": 11.911, "args": { "External id": 16119,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650679535.878, "dur": 20.029, "args": { "External id": 16120,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650679537.793, "dur": 1.569, "args": { "External id": 16121,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679542.920, "dur": 0.711, "args": { "External id": 16122,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650679557.306, "dur": 11.276, "args": { "External id": 16123,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650679569.884, "dur": 9.977, "args": { "External id": 16124,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650679588.069, "dur": 1.906, "args": { "External id": 16125,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679596.254, "dur": 3.588, "args": { "External id": 16126,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679598.192, "dur": 0.781, "args": { "External id": 16127,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650679663.912, "dur": 61.466, "args": { "External id": 16128,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679730.418, "dur": 7.527, "args": { "External id": 16129,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679735.198, "dur": 0.556, "args": { "External id": 16130,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650679739.420, "dur": 23.300, "args": { "External id": 16131,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650679767.692, "dur": 7.649, "args": { "External id": 16132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650679769.283, "dur": 5.302, "args": { "External id": 16133,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679771.635, "dur": 2.697, "args": { "External id": 16134,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650679778.503, "dur": 43.256, "args": { "External id": 16135,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650679781.375, "dur": 39.758, "args": { "External id": 16136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650679825.773, "dur": 14.368, "args": { "External id": 16137,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679845.531, "dur": 3.970, "args": { "External id": 16138,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679847.527, "dur": 1.156, "args": { "External id": 16139,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650679853.767, "dur": 48.580, "args": { "External id": 16140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650679854.622, "dur": 5.433, "args": { "External id": 16141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650679855.417, "dur": 4.021, "args": { "External id": 16142,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679858.729, "dur": 0.564, "args": { "External id": 16143,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650679860.759, "dur": 41.152, "args": { "External id": 16144,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650679861.332, "dur": 40.105, "args": { "External id": 16145,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650679906.159, "dur": 3.664, "args": { "External id": 16146,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650679908.077, "dur": 0.829, "args": { "External id": 16147,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650679915.102, "dur": 1.296, "args": { "External id": 16148,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679925.476, "dur": 5.455, "args": { "External id": 16149,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650679927.103, "dur": 3.570, "args": { "External id": 16150,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650680057.097, "dur": 193.722, "args": { "External id": 16151,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680059.386, "dur": 3.024, "args": { "External id": 16152,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650680065.791, "dur": 184.587, "args": { "External id": 16153,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650680067.274, "dur": 0.461, "args": { "External id": 16154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650680070.472, "dur": 22.176, "args": { "External id": 16155,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650680094.218, "dur": 4.767, "args": { "External id": 16156,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680096.055, "dur": 2.612, "args": { "External id": 16157,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650680099.853, "dur": 20.738, "args": { "External id": 16158,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680100.986, "dur": 1.516, "args": { "External id": 16159,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650680103.922, "dur": 16.424, "args": { "External id": 16160,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650680106.785, "dur": 2.791, "args": { "External id": 16161,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650680122.082, "dur": 20.879, "args": { "External id": 16162,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650680144.087, "dur": 12.420, "args": { "External id": 16163,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650680159.667, "dur": 14.136, "args": { "External id": 16164,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650680176.766, "dur": 12.005, "args": { "External id": 16165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650680190.161, "dur": 20.240, "args": { "External id": 16166,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650680191.992, "dur": 1.748, "args": { "External id": 16167,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680195.302, "dur": 2.447, "args": { "External id": 16168,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650680211.513, "dur": 11.140, "args": { "External id": 16169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650680223.607, "dur": 24.834, "args": { "External id": 16170,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650680261.188, "dur": 2.425, "args": { "External id": 16171,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650680273.164, "dur": 3.594, "args": { "External id": 16172,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680275.388, "dur": 0.413, "args": { "External id": 16173,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650680343.998, "dur": 54.785, "args": { "External id": 16174,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650680403.630, "dur": 4.639, "args": { "External id": 16175,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680406.625, "dur": 0.657, "args": { "External id": 16176,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650680409.792, "dur": 24.500, "args": { "External id": 16177,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650680439.062, "dur": 6.830, "args": { "External id": 16178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650680440.411, "dur": 4.868, "args": { "External id": 16179,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680443.695, "dur": 1.416, "args": { "External id": 16180,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650680448.729, "dur": 39.224, "args": { "External id": 16181,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650680449.705, "dur": 37.763, "args": { "External id": 16182,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650680491.860, "dur": 14.367, "args": { "External id": 16183,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650680511.900, "dur": 3.738, "args": { "External id": 16184,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680513.807, "dur": 0.972, "args": { "External id": 16185,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650680521.397, "dur": 45.295, "args": { "External id": 16186,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650680522.251, "dur": 3.178, "args": { "External id": 16187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650680522.920, "dur": 2.043, "args": { "External id": 16188,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680524.166, "dur": 0.667, "args": { "External id": 16189,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650680526.240, "dur": 40.124, "args": { "External id": 16190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650680526.682, "dur": 39.198, "args": { "External id": 16191,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650680584.716, "dur": 4.179, "args": { "External id": 16192,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680587.088, "dur": 0.589, "args": { "External id": 16193,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650680595.990, "dur": 1.295, "args": { "External id": 16194,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680604.488, "dur": 7.636, "args": { "External id": 16195,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680606.162, "dur": 5.688, "args": { "External id": 16196,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650680691.639, "dur": 171.497, "args": { "External id": 16197,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680693.450, "dur": 2.356, "args": { "External id": 16198,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650680697.249, "dur": 165.162, "args": { "External id": 16199,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650680698.849, "dur": 0.375, "args": { "External id": 16200,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650680701.819, "dur": 21.055, "args": { "External id": 16201,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650680724.653, "dur": 3.091, "args": { "External id": 16202,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680726.509, "dur": 1.059, "args": { "External id": 16203,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650680728.581, "dur": 22.357, "args": { "External id": 16204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650680729.913, "dur": 1.961, "args": { "External id": 16205,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650680732.883, "dur": 17.766, "args": { "External id": 16206,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650680737.190, "dur": 2.222, "args": { "External id": 16207,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650680752.232, "dur": 19.251, "args": { "External id": 16208,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650680772.598, "dur": 12.792, "args": { "External id": 16209,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650680787.654, "dur": 12.406, "args": { "External id": 16210,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650680802.939, "dur": 11.857, "args": { "External id": 16211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650680816.351, "dur": 17.664, "args": { "External id": 16212,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650680818.248, "dur": 1.299, "args": { "External id": 16213,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680821.089, "dur": 0.788, "args": { "External id": 16214,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650680835.242, "dur": 13.583, "args": { "External id": 16215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650680849.693, "dur": 11.746, "args": { "External id": 16216,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650680870.633, "dur": 1.632, "args": { "External id": 16217,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650680879.664, "dur": 3.062, "args": { "External id": 16218,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650680881.561, "dur": 0.469, "args": { "External id": 16219,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650680941.576, "dur": 81.549, "args": { "External id": 16220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681029.579, "dur": 5.671, "args": { "External id": 16221,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681032.627, "dur": 1.070, "args": { "External id": 16222,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650681036.686, "dur": 25.285, "args": { "External id": 16223,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650681067.553, "dur": 7.215, "args": { "External id": 16224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650681070.833, "dur": 3.311, "args": { "External id": 16225,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681072.862, "dur": 1.084, "args": { "External id": 16226,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650681080.507, "dur": 42.845, "args": { "External id": 16227,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650681081.698, "dur": 41.036, "args": { "External id": 16228,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650681127.571, "dur": 15.868, "args": { "External id": 16229,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681149.042, "dur": 5.330, "args": { "External id": 16230,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681152.878, "dur": 0.741, "args": { "External id": 16231,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650681158.397, "dur": 87.417, "args": { "External id": 16232,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650681159.098, "dur": 3.220, "args": { "External id": 16233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650681160.126, "dur": 1.736, "args": { "External id": 16234,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681161.081, "dur": 0.589, "args": { "External id": 16235,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650681162.936, "dur": 82.331, "args": { "External id": 16236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650681163.483, "dur": 80.956, "args": { "External id": 16237,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681253.589, "dur": 6.458, "args": { "External id": 16238,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681255.999, "dur": 2.608, "args": { "External id": 16239,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650681266.539, "dur": 1.578, "args": { "External id": 16240,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681275.672, "dur": 6.529, "args": { "External id": 16241,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681277.678, "dur": 4.250, "args": { "External id": 16242,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650681369.997, "dur": 170.672, "args": { "External id": 16243,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681371.798, "dur": 1.898, "args": { "External id": 16244,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650681375.521, "dur": 164.647, "args": { "External id": 16245,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650681377.006, "dur": 0.571, "args": { "External id": 16246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650681378.458, "dur": 22.408, "args": { "External id": 16247,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650681402.629, "dur": 2.884, "args": { "External id": 16248,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681404.482, "dur": 0.730, "args": { "External id": 16249,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650681406.601, "dur": 24.417, "args": { "External id": 16250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681407.789, "dur": 1.688, "args": { "External id": 16251,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650681412.105, "dur": 18.637, "args": { "External id": 16252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650681416.186, "dur": 2.605, "args": { "External id": 16253,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650681432.413, "dur": 20.961, "args": { "External id": 16254,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650681454.600, "dur": 11.808, "args": { "External id": 16255,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650681469.089, "dur": 13.717, "args": { "External id": 16256,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650681484.090, "dur": 11.240, "args": { "External id": 16257,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650681496.918, "dur": 18.643, "args": { "External id": 16258,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650681498.432, "dur": 1.601, "args": { "External id": 16259,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681503.188, "dur": 0.748, "args": { "External id": 16260,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650681516.787, "dur": 10.962, "args": { "External id": 16261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650681528.887, "dur": 10.329, "args": { "External id": 16262,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650681546.517, "dur": 1.575, "args": { "External id": 16263,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681556.178, "dur": 3.183, "args": { "External id": 16264,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681558.250, "dur": 0.423, "args": { "External id": 16265,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650681617.023, "dur": 49.610, "args": { "External id": 16266,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681671.152, "dur": 5.962, "args": { "External id": 16267,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681675.015, "dur": 1.049, "args": { "External id": 16268,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650681678.312, "dur": 21.305, "args": { "External id": 16269,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650681703.592, "dur": 4.414, "args": { "External id": 16270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650681704.763, "dur": 2.627, "args": { "External id": 16271,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681706.302, "dur": 0.936, "args": { "External id": 16272,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650681710.228, "dur": 36.960, "args": { "External id": 16273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650681711.493, "dur": 35.230, "args": { "External id": 16274,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650681752.777, "dur": 13.207, "args": { "External id": 16275,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681771.083, "dur": 3.029, "args": { "External id": 16276,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681772.711, "dur": 0.617, "args": { "External id": 16277,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650681777.429, "dur": 47.726, "args": { "External id": 16278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650681778.339, "dur": 6.591, "args": { "External id": 16279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650681778.940, "dur": 5.487, "args": { "External id": 16280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681783.715, "dur": 0.532, "args": { "External id": 16281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650681785.551, "dur": 39.212, "args": { "External id": 16282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650681786.076, "dur": 37.981, "args": { "External id": 16283,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650681835.374, "dur": 3.443, "args": { "External id": 16284,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681836.995, "dur": 0.664, "args": { "External id": 16285,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650681843.578, "dur": 1.227, "args": { "External id": 16286,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681851.451, "dur": 6.559, "args": { "External id": 16287,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681854.445, "dur": 3.318, "args": { "External id": 16288,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650681929.868, "dur": 208.281, "args": { "External id": 16289,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681933.156, "dur": 2.180, "args": { "External id": 16290,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650681936.787, "dur": 200.749, "args": { "External id": 16291,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650681938.039, "dur": 0.313, "args": { "External id": 16292,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650681939.027, "dur": 17.417, "args": { "External id": 16293,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650681958.112, "dur": 4.348, "args": { "External id": 16294,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650681961.175, "dur": 1.017, "args": { "External id": 16295,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650681963.116, "dur": 58.999, "args": { "External id": 16296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650681964.197, "dur": 1.799, "args": { "External id": 16297,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650681968.813, "dur": 52.589, "args": { "External id": 16298,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650681970.896, "dur": 2.488, "args": { "External id": 16299,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650682024.195, "dur": 21.637, "args": { "External id": 16300,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650682047.194, "dur": 15.390, "args": { "External id": 16301,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650682065.470, "dur": 12.768, "args": { "External id": 16302,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650682079.463, "dur": 11.720, "args": { "External id": 16303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650682092.981, "dur": 19.828, "args": { "External id": 16304,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650682095.024, "dur": 1.514, "args": { "External id": 16305,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682099.732, "dur": 0.790, "args": { "External id": 16306,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650682114.071, "dur": 11.133, "args": { "External id": 16307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650682126.039, "dur": 10.437, "args": { "External id": 16308,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650682145.418, "dur": 1.921, "args": { "External id": 16309,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682155.241, "dur": 3.155, "args": { "External id": 16310,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682157.181, "dur": 0.506, "args": { "External id": 16311,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650682219.570, "dur": 69.948, "args": { "External id": 16312,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682296.104, "dur": 7.349, "args": { "External id": 16313,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682301.083, "dur": 0.924, "args": { "External id": 16314,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650682304.670, "dur": 24.150, "args": { "External id": 16315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650682333.945, "dur": 4.959, "args": { "External id": 16316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650682335.230, "dur": 2.963, "args": { "External id": 16317,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682336.668, "dur": 1.332, "args": { "External id": 16318,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650682341.600, "dur": 41.457, "args": { "External id": 16319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650682344.677, "dur": 37.860, "args": { "External id": 16320,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650682386.773, "dur": 13.698, "args": { "External id": 16321,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682405.807, "dur": 3.627, "args": { "External id": 16322,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682407.940, "dur": 0.726, "args": { "External id": 16323,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650682413.212, "dur": 53.164, "args": { "External id": 16324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650682421.516, "dur": 4.857, "args": { "External id": 16325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650682423.888, "dur": 2.011, "args": { "External id": 16326,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682425.057, "dur": 0.711, "args": { "External id": 16327,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650682426.949, "dur": 39.099, "args": { "External id": 16328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650682427.566, "dur": 38.033, "args": { "External id": 16329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682470.254, "dur": 3.565, "args": { "External id": 16330,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682471.981, "dur": 0.685, "args": { "External id": 16331,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650682481.170, "dur": 1.203, "args": { "External id": 16332,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650682489.692, "dur": 7.743, "args": { "External id": 16333,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650682491.305, "dur": 5.862, "args": { "External id": 16334,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650682581.869, "dur": 169.797, "args": { "External id": 16335,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650682583.904, "dur": 2.299, "args": { "External id": 16336,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650682587.823, "dur": 163.270, "args": { "External id": 16337,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650682590.923, "dur": 0.585, "args": { "External id": 16338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650682592.510, "dur": 20.978, "args": { "External id": 16339,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650682615.313, "dur": 2.815, "args": { "External id": 16340,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682617.224, "dur": 0.633, "args": { "External id": 16341,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650682619.169, "dur": 22.083, "args": { "External id": 16342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650682620.182, "dur": 1.760, "args": { "External id": 16343,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650682622.966, "dur": 18.015, "args": { "External id": 16344,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650682627.152, "dur": 2.492, "args": { "External id": 16345,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650682642.600, "dur": 19.368, "args": { "External id": 16346,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650682663.065, "dur": 11.825, "args": { "External id": 16347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650682680.123, "dur": 12.912, "args": { "External id": 16348,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650682694.126, "dur": 11.124, "args": { "External id": 16349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650682707.135, "dur": 18.791, "args": { "External id": 16350,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650682708.768, "dur": 1.735, "args": { "External id": 16351,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682712.596, "dur": 0.680, "args": { "External id": 16352,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650682727.242, "dur": 10.754, "args": { "External id": 16353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650682740.554, "dur": 9.662, "args": { "External id": 16354,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650682757.744, "dur": 1.638, "args": { "External id": 16355,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682767.146, "dur": 3.073, "args": { "External id": 16356,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682769.175, "dur": 0.349, "args": { "External id": 16357,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650682831.089, "dur": 44.269, "args": { "External id": 16358,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682879.333, "dur": 3.836, "args": { "External id": 16359,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682881.549, "dur": 0.642, "args": { "External id": 16360,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650682884.392, "dur": 20.964, "args": { "External id": 16361,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650682909.638, "dur": 6.676, "args": { "External id": 16362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650682912.533, "dur": 3.173, "args": { "External id": 16363,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682914.298, "dur": 1.220, "args": { "External id": 16364,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650682918.564, "dur": 40.218, "args": { "External id": 16365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650682919.435, "dur": 38.741, "args": { "External id": 16366,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650682962.093, "dur": 13.120, "args": { "External id": 16367,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650682980.057, "dur": 42.852, "args": { "External id": 16368,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650682983.444, "dur": 0.591, "args": { "External id": 16369,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650683028.453, "dur": 50.805, "args": { "External id": 16370,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650683029.190, "dur": 4.176, "args": { "External id": 16371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650683030.257, "dur": 2.651, "args": { "External id": 16372,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683031.936, "dur": 0.842, "args": { "External id": 16373,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650683034.150, "dur": 44.758, "args": { "External id": 16374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650683034.854, "dur": 43.404, "args": { "External id": 16375,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650683083.843, "dur": 5.233, "args": { "External id": 16376,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683085.726, "dur": 2.115, "args": { "External id": 16377,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650683097.438, "dur": 1.456, "args": { "External id": 16378,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683106.191, "dur": 5.868, "args": { "External id": 16379,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683107.915, "dur": 3.898, "args": { "External id": 16380,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650683193.597, "dur": 219.491, "args": { "External id": 16381,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683195.720, "dur": 2.267, "args": { "External id": 16382,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650683201.089, "dur": 211.507, "args": { "External id": 16383,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650683202.347, "dur": 0.517, "args": { "External id": 16384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650683248.053, "dur": 26.524, "args": { "External id": 16385,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650683277.015, "dur": 3.335, "args": { "External id": 16386,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683279.156, "dur": 0.896, "args": { "External id": 16387,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650683281.117, "dur": 21.919, "args": { "External id": 16388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683281.931, "dur": 1.835, "args": { "External id": 16389,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650683284.835, "dur": 17.891, "args": { "External id": 16390,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650683289.053, "dur": 2.897, "args": { "External id": 16391,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650683304.421, "dur": 20.511, "args": { "External id": 16392,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650683326.034, "dur": 12.585, "args": { "External id": 16393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650683342.622, "dur": 12.851, "args": { "External id": 16394,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650683356.594, "dur": 11.504, "args": { "External id": 16395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650683369.616, "dur": 17.719, "args": { "External id": 16396,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650683371.356, "dur": 1.341, "args": { "External id": 16397,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683374.407, "dur": 0.589, "args": { "External id": 16398,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650683388.611, "dur": 11.103, "args": { "External id": 16399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650683402.233, "dur": 9.490, "args": { "External id": 16400,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650683420.736, "dur": 2.173, "args": { "External id": 16401,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650683431.802, "dur": 3.144, "args": { "External id": 16402,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683433.806, "dur": 0.356, "args": { "External id": 16403,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650683500.435, "dur": 52.436, "args": { "External id": 16404,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650683557.301, "dur": 4.316, "args": { "External id": 16405,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683559.647, "dur": 0.901, "args": { "External id": 16406,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650683562.795, "dur": 21.801, "args": { "External id": 16407,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650683590.953, "dur": 5.101, "args": { "External id": 16408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650683592.432, "dur": 2.774, "args": { "External id": 16409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683594.099, "dur": 0.960, "args": { "External id": 16410,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650683598.544, "dur": 37.673, "args": { "External id": 16411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650683599.415, "dur": 36.171, "args": { "External id": 16412,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650683639.709, "dur": 12.720, "args": { "External id": 16413,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650683657.148, "dur": 5.770, "args": { "External id": 16414,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683661.515, "dur": 0.621, "args": { "External id": 16415,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650683666.331, "dur": 45.802, "args": { "External id": 16416,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650683667.028, "dur": 4.235, "args": { "External id": 16417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650683667.628, "dur": 3.156, "args": { "External id": 16418,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683668.748, "dur": 1.871, "args": { "External id": 16419,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650683672.074, "dur": 39.762, "args": { "External id": 16420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650683674.115, "dur": 37.134, "args": { "External id": 16421,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650683715.712, "dur": 3.491, "args": { "External id": 16422,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683717.581, "dur": 0.648, "args": { "External id": 16423,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650683724.092, "dur": 1.390, "args": { "External id": 16424,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683732.585, "dur": 6.884, "args": { "External id": 16425,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683736.011, "dur": 3.195, "args": { "External id": 16426,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650683814.042, "dur": 159.102, "args": { "External id": 16427,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683816.148, "dur": 1.663, "args": { "External id": 16428,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650683819.448, "dur": 153.246, "args": { "External id": 16429,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650683820.475, "dur": 0.300, "args": { "External id": 16430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650683823.468, "dur": 17.513, "args": { "External id": 16431,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650683842.459, "dur": 2.650, "args": { "External id": 16432,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683844.264, "dur": 0.635, "args": { "External id": 16433,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650683845.748, "dur": 25.515, "args": { "External id": 16434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650683852.211, "dur": 2.598, "args": { "External id": 16435,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650683856.068, "dur": 14.883, "args": { "External id": 16436,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650683858.111, "dur": 2.411, "args": { "External id": 16437,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650683872.399, "dur": 17.436, "args": { "External id": 16438,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650683890.825, "dur": 10.781, "args": { "External id": 16439,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650683903.915, "dur": 12.342, "args": { "External id": 16440,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650683917.310, "dur": 10.340, "args": { "External id": 16441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650683929.580, "dur": 18.663, "args": { "External id": 16442,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650683930.757, "dur": 1.457, "args": { "External id": 16443,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650683935.552, "dur": 0.695, "args": { "External id": 16444,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650683949.331, "dur": 10.749, "args": { "External id": 16445,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650683960.825, "dur": 11.016, "args": { "External id": 16446,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650683978.857, "dur": 1.407, "args": { "External id": 16447,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684025.556, "dur": 4.731, "args": { "External id": 16448,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684028.265, "dur": 0.899, "args": { "External id": 16449,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650684096.144, "dur": 51.816, "args": { "External id": 16450,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684152.663, "dur": 5.531, "args": { "External id": 16451,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684156.285, "dur": 0.939, "args": { "External id": 16452,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650684159.398, "dur": 23.499, "args": { "External id": 16453,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650684187.210, "dur": 5.146, "args": { "External id": 16454,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650684188.407, "dur": 3.265, "args": { "External id": 16455,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684190.414, "dur": 1.045, "args": { "External id": 16456,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650684194.836, "dur": 54.618, "args": { "External id": 16457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650684197.485, "dur": 51.122, "args": { "External id": 16458,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650684254.754, "dur": 15.321, "args": { "External id": 16459,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650684274.934, "dur": 23.289, "args": { "External id": 16460,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650684277.087, "dur": 20.776, "args": { "External id": 16461,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684283.583, "dur": 0.753, "args": { "External id": 16462,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650684303.341, "dur": 27.356, "args": { "External id": 16463,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650684304.915, "dur": 25.496, "args": { "External id": 16464,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684309.463, "dur": 4.101, "args": { "External id": 16465,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650684317.095, "dur": 12.876, "args": { "External id": 16466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650684342.417, "dur": 4.826, "args": { "External id": 16467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9962 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650684344.244, "dur": 2.687, "args": { "External id": 16468,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650684348.389, "dur": 1.029, "args": { "External id": 16469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9964 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650684348.904, "dur": 0.442, "args": { "External id": 16470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650684393.494, "dur": 19.946, "args": { "External id": 16471,"Sequence number": 246760, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650684414.952, "dur": 12.814, "args": { "External id": 16472,"Sequence number": 246761, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9967 } }, { "ph": "s", "id": 9, "pid": 1336759, "tid": 1336759, "ts": 1295650684414.952, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684433.612, "dur": 5.902, "args": { "External id": 16473,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684437.090, "dur": 0.954, "args": { "External id": 16474,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650684447.175, "dur": 6.504, "args": { "External id": 16475,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "3"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684451.366, "dur": 1.081, "args": { "External id": 16476,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684454.858, "dur": 2.868, "args": { "External id": 16477,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684456.251, "dur": 0.900, "args": { "External id": 16478,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684463.344, "dur": 5.933, "args": { "External id": 16479,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9974 } }, { "ph": "s", "id": 8, "pid": 1336759, "tid": 1336759, "ts": 1295650684463.344, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684466.569, "dur": 1.396, "args": { "External id": 16480,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684470.450, "dur": 5.086, "args": { "External id": 16481,"Sequence number": 246763, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9976 } }, { "ph": "s", "id": 7, "pid": 1336759, "tid": 1336759, "ts": 1295650684470.450, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684473.890, "dur": 0.900, "args": { "External id": 16482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336759, "tid": 1336759, "ts": 1295650684476.406, "dur": 6.989, "args": { "External id": 16483,"Sequence number": 246764, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9978 } }, { "ph": "s", "id": 6, "pid": 1336759, "tid": 1336759, "ts": 1295650684476.406, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684481.703, "dur": 0.874, "args": { "External id": 16484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650684484.430, "dur": 5.727, "args": { "External id": 16485,"Sequence number": 246765, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9980 } }, { "ph": "s", "id": 5, "pid": 1336759, "tid": 1336759, "ts": 1295650684484.430, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684487.175, "dur": 2.204, "args": { "External id": 16486,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650684494.410, "dur": 33.163, "args": { "External id": 16487,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650684496.381, "dur": 30.993, "args": { "External id": 16488,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684498.838, "dur": 6.008, "args": { "External id": 16489,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650684501.052, "dur": 3.126, "args": { "External id": 16490,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650684505.490, "dur": 21.477, "args": { "External id": 16491,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650684551.514, "dur": 4.944, "args": { "External id": 16492,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9987 } }, { "ph": "s", "id": 4, "pid": 1336759, "tid": 1336759, "ts": 1295650684551.514, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650684558.654, "dur": 1.059, "args": { "External id": 16493,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9988 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336759, "tid": 1336759, "ts": 1295650684591.590, "dur": 44597.407, "args": { "External id": 16494,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9989 } }, { "ph": "s", "id": 3, "pid": 1336759, "tid": 1336759, "ts": 1295650684591.590, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336759, "tid": 1336759, "ts": 1295650684604.896, "dur": 23.894, "args": { "External id": 16495,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295650684605.482, "dur": 23.111, "args": { "External id": 16496,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684606.443, "dur": 6.301, "args": { "External id": 16497,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650684607.804, "dur": 4.504, "args": { "External id": 16498,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650684613.360, "dur": 14.775, "args": { "External id": 16499,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684644.527, "dur": 25.171, "args": { "External id": 16500,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684645.717, "dur": 7.769, "args": { "External id": 16501,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684649.612, "dur": 3.414, "args": { "External id": 16502,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650684655.048, "dur": 14.432, "args": { "External id": 16503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650684656.747, "dur": 12.265, "args": { "External id": 16504,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684672.828, "dur": 16.991, "args": { "External id": 16505,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650684673.509, "dur": 4.148, "args": { "External id": 16506,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684675.034, "dur": 2.382, "args": { "External id": 16507,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650684678.303, "dur": 11.321, "args": { "External id": 16508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650684678.727, "dur": 10.548, "args": { "External id": 16509,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 10004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295650684695.076, "dur": 16.277, "args": { "External id": 16510,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650684698.225, "dur": 2.877, "args": { "External id": 16511,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295650684701.700, "dur": 9.395, "args": { "External id": 16512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 10007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650684702.184, "dur": 8.612, "args": { "External id": 16513,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1336759, "ts": 1295650684715.877, "dur": 21.253, "args": { "External id": 16514,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650684739.885, "dur": 43.052, "args": { "External id": 16515,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650684741.315, "dur": 41.257, "args": { "External id": 16516,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684747.259, "dur": 0.714, "args": { "External id": 16517,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650684749.407, "dur": 19.163, "args": { "External id": 16518,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650684750.753, "dur": 17.638, "args": { "External id": 16519,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 10014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650684752.933, "dur": 2.574, "args": { "External id": 16520,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650684756.297, "dur": 11.691, "args": { "External id": 16521,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 10016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295650684788.128, "dur": 38923.616, "args": { "External id": 16522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295650684789.831, "dur": 38919.085, "args": { "External id": 16523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650723727.777, "dur": 8.502, "args": { "External id": 16524,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650723732.876, "dur": 1.486, "args": { "External id": 16525,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650723741.866, "dur": 107.072, "args": { "External id": 16526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650723743.285, "dur": 8.545, "args": { "External id": 16527,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650723746.038, "dur": 5.042, "args": { "External id": 16528,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650723749.860, "dur": 0.930, "args": { "External id": 16529,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650723753.103, "dur": 95.152, "args": { "External id": 16530,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650723754.863, "dur": 92.678, "args": { "External id": 16531,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650723852.306, "dur": 3.877, "args": { "External id": 16532,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650723854.385, "dur": 0.668, "args": { "External id": 16533,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650723863.657, "dur": 2.593, "args": { "External id": 16534,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650723877.440, "dur": 7.040, "args": { "External id": 16535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650723879.817, "dur": 4.371, "args": { "External id": 16536,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650724044.612, "dur": 205.917, "args": { "External id": 16537,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724049.150, "dur": 3.504, "args": { "External id": 16538,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650724054.041, "dur": 195.944, "args": { "External id": 16539,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650724055.639, "dur": 0.420, "args": { "External id": 16540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650724057.393, "dur": 25.349, "args": { "External id": 16541,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650724086.938, "dur": 4.985, "args": { "External id": 16542,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724090.531, "dur": 1.026, "args": { "External id": 16543,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650724092.804, "dur": 22.725, "args": { "External id": 16544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724093.937, "dur": 1.610, "args": { "External id": 16545,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650724096.717, "dur": 18.570, "args": { "External id": 16546,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650724100.412, "dur": 3.410, "args": { "External id": 16547,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650724117.204, "dur": 23.423, "args": { "External id": 16548,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650724142.357, "dur": 13.919, "args": { "External id": 16549,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650724159.342, "dur": 14.324, "args": { "External id": 16550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650724175.171, "dur": 12.574, "args": { "External id": 16551,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650724191.236, "dur": 19.308, "args": { "External id": 16552,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650724193.378, "dur": 1.351, "args": { "External id": 16553,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724196.766, "dur": 0.621, "args": { "External id": 16554,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650724211.811, "dur": 11.668, "args": { "External id": 16555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650724224.894, "dur": 23.016, "args": { "External id": 16556,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650724259.734, "dur": 2.555, "args": { "External id": 16557,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650724271.137, "dur": 4.169, "args": { "External id": 16558,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724273.252, "dur": 1.031, "args": { "External id": 16559,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650724352.371, "dur": 69.418, "args": { "External id": 16560,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650724427.317, "dur": 5.833, "args": { "External id": 16561,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724430.061, "dur": 0.883, "args": { "External id": 16562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650724434.802, "dur": 27.254, "args": { "External id": 16563,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650724467.636, "dur": 7.680, "args": { "External id": 16564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650724469.363, "dur": 5.333, "args": { "External id": 16565,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724473.181, "dur": 1.263, "args": { "External id": 16566,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650724478.374, "dur": 42.538, "args": { "External id": 16567,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650724479.693, "dur": 40.642, "args": { "External id": 16568,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650724525.628, "dur": 15.816, "args": { "External id": 16569,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650724547.492, "dur": 3.546, "args": { "External id": 16570,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724549.646, "dur": 0.718, "args": { "External id": 16571,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650724557.121, "dur": 46.703, "args": { "External id": 16572,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650724557.978, "dur": 3.886, "args": { "External id": 16573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650724558.939, "dur": 2.344, "args": { "External id": 16574,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724560.142, "dur": 0.995, "args": { "External id": 16575,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650724562.382, "dur": 41.014, "args": { "External id": 16576,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650724563.284, "dur": 39.652, "args": { "External id": 16577,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650724609.849, "dur": 5.052, "args": { "External id": 16578,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724611.772, "dur": 2.013, "args": { "External id": 16579,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650724621.169, "dur": 1.462, "args": { "External id": 16580,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724630.413, "dur": 6.465, "args": { "External id": 16581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724632.152, "dur": 4.456, "args": { "External id": 16582,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650724729.673, "dur": 177.963, "args": { "External id": 16583,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724731.567, "dur": 2.315, "args": { "External id": 16584,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650724735.494, "dur": 171.570, "args": { "External id": 16585,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650724736.899, "dur": 0.423, "args": { "External id": 16586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650724738.251, "dur": 21.052, "args": { "External id": 16587,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650724760.846, "dur": 3.394, "args": { "External id": 16588,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724763.151, "dur": 0.858, "args": { "External id": 16589,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650724765.413, "dur": 31.867, "args": { "External id": 16590,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650724766.358, "dur": 8.345, "args": { "External id": 16591,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650724775.680, "dur": 21.278, "args": { "External id": 16592,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650724781.921, "dur": 4.222, "args": { "External id": 16593,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650724798.756, "dur": 20.217, "args": { "External id": 16594,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650724820.105, "dur": 13.197, "args": { "External id": 16595,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650724836.457, "dur": 12.586, "args": { "External id": 16596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650724850.337, "dur": 11.100, "args": { "External id": 16597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650724862.981, "dur": 17.741, "args": { "External id": 16598,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650724864.627, "dur": 1.661, "args": { "External id": 16599,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724868.389, "dur": 0.704, "args": { "External id": 16600,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650724883.784, "dur": 11.250, "args": { "External id": 16601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650724895.937, "dur": 10.249, "args": { "External id": 16602,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650724913.584, "dur": 1.754, "args": { "External id": 16603,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650724923.497, "dur": 3.456, "args": { "External id": 16604,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650724925.701, "dur": 0.431, "args": { "External id": 16605,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725032.727, "dur": 56.890, "args": { "External id": 16606,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725094.814, "dur": 5.899, "args": { "External id": 16607,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725097.966, "dur": 1.436, "args": { "External id": 16608,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650725104.296, "dur": 24.961, "args": { "External id": 16609,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650725134.378, "dur": 4.939, "args": { "External id": 16610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650725135.704, "dur": 3.020, "args": { "External id": 16611,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725137.690, "dur": 0.817, "args": { "External id": 16612,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650725141.808, "dur": 38.305, "args": { "External id": 16613,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725142.960, "dur": 36.624, "args": { "External id": 16614,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650725184.433, "dur": 14.828, "args": { "External id": 16615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725207.012, "dur": 3.520, "args": { "External id": 16616,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725208.915, "dur": 0.837, "args": { "External id": 16617,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650725214.431, "dur": 67.685, "args": { "External id": 16618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650725215.247, "dur": 5.623, "args": { "External id": 16619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650725215.865, "dur": 4.428, "args": { "External id": 16620,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725219.279, "dur": 0.881, "args": { "External id": 16621,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650725223.249, "dur": 58.408, "args": { "External id": 16622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725224.146, "dur": 56.531, "args": { "External id": 16623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725288.201, "dur": 4.362, "args": { "External id": 16624,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725290.514, "dur": 0.865, "args": { "External id": 16625,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650725299.078, "dur": 1.711, "args": { "External id": 16626,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650725308.097, "dur": 6.393, "args": { "External id": 16627,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650725310.147, "dur": 4.094, "args": { "External id": 16628,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650725401.904, "dur": 175.816, "args": { "External id": 16629,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650725404.369, "dur": 2.154, "args": { "External id": 16630,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650725407.717, "dur": 169.445, "args": { "External id": 16631,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650725410.996, "dur": 0.423, "args": { "External id": 16632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650725412.632, "dur": 21.536, "args": { "External id": 16633,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650725435.805, "dur": 3.565, "args": { "External id": 16634,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725438.120, "dur": 0.948, "args": { "External id": 16635,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650725440.147, "dur": 25.466, "args": { "External id": 16636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650725443.027, "dur": 1.322, "args": { "External id": 16637,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650725445.302, "dur": 19.950, "args": { "External id": 16638,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650725450.180, "dur": 2.449, "args": { "External id": 16639,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650725466.988, "dur": 21.460, "args": { "External id": 16640,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650725489.605, "dur": 12.050, "args": { "External id": 16641,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650725504.270, "dur": 13.080, "args": { "External id": 16642,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650725518.652, "dur": 11.465, "args": { "External id": 16643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650725531.690, "dur": 18.745, "args": { "External id": 16644,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650725533.689, "dur": 1.613, "args": { "External id": 16645,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725537.344, "dur": 0.646, "args": { "External id": 16646,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650725553.576, "dur": 11.193, "args": { "External id": 16647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650725565.787, "dur": 10.464, "args": { "External id": 16648,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650725584.217, "dur": 1.736, "args": { "External id": 16649,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725593.912, "dur": 3.420, "args": { "External id": 16650,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725595.811, "dur": 0.754, "args": { "External id": 16651,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725659.624, "dur": 47.994, "args": { "External id": 16652,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725712.406, "dur": 5.684, "args": { "External id": 16653,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725716.242, "dur": 0.904, "args": { "External id": 16654,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650725719.489, "dur": 29.943, "args": { "External id": 16655,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650725753.509, "dur": 6.236, "args": { "External id": 16656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650725754.703, "dur": 4.412, "args": { "External id": 16657,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725756.370, "dur": 2.493, "args": { "External id": 16658,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650725762.358, "dur": 70.219, "args": { "External id": 16659,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725763.359, "dur": 68.696, "args": { "External id": 16660,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650725838.027, "dur": 37.485, "args": { "External id": 16661,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725880.605, "dur": 3.413, "args": { "External id": 16662,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725882.575, "dur": 0.704, "args": { "External id": 16663,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650725887.684, "dur": 71.381, "args": { "External id": 16664,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650725888.376, "dur": 4.636, "args": { "External id": 16665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650725889.180, "dur": 3.336, "args": { "External id": 16666,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725891.734, "dur": 0.629, "args": { "External id": 16667,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650725893.721, "dur": 64.931, "args": { "External id": 16668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650725894.222, "dur": 63.871, "args": { "External id": 16669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650725962.695, "dur": 16.395, "args": { "External id": 16670,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650725977.357, "dur": 0.645, "args": { "External id": 16671,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650726034.750, "dur": 2.391, "args": { "External id": 16672,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726047.038, "dur": 8.734, "args": { "External id": 16673,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726048.728, "dur": 6.748, "args": { "External id": 16674,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650726150.077, "dur": 199.456, "args": { "External id": 16675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726152.134, "dur": 2.218, "args": { "External id": 16676,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650726155.803, "dur": 193.159, "args": { "External id": 16677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650726157.717, "dur": 0.463, "args": { "External id": 16678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650726159.223, "dur": 23.581, "args": { "External id": 16679,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650726186.381, "dur": 3.854, "args": { "External id": 16680,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726188.752, "dur": 1.088, "args": { "External id": 16681,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650726191.136, "dur": 23.297, "args": { "External id": 16682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726192.153, "dur": 1.617, "args": { "External id": 16683,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650726194.905, "dur": 19.278, "args": { "External id": 16684,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650726199.477, "dur": 3.053, "args": { "External id": 16685,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650726215.805, "dur": 36.433, "args": { "External id": 16686,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650726254.882, "dur": 13.905, "args": { "External id": 16687,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650726272.127, "dur": 13.684, "args": { "External id": 16688,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650726287.077, "dur": 11.658, "args": { "External id": 16689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650726302.962, "dur": 20.625, "args": { "External id": 16690,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650726305.440, "dur": 2.131, "args": { "External id": 16691,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726309.481, "dur": 0.964, "args": { "External id": 16692,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650726324.893, "dur": 10.944, "args": { "External id": 16693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650726336.862, "dur": 10.801, "args": { "External id": 16694,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650726356.688, "dur": 2.138, "args": { "External id": 16695,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650726368.463, "dur": 3.903, "args": { "External id": 16696,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726370.990, "dur": 0.483, "args": { "External id": 16697,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650726442.959, "dur": 61.049, "args": { "External id": 16698,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650726508.748, "dur": 5.190, "args": { "External id": 16699,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726511.809, "dur": 1.106, "args": { "External id": 16700,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650726515.404, "dur": 24.056, "args": { "External id": 16701,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650726544.085, "dur": 6.904, "args": { "External id": 16702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650726545.668, "dur": 4.570, "args": { "External id": 16703,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726548.868, "dur": 1.150, "args": { "External id": 16704,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650726553.627, "dur": 41.270, "args": { "External id": 16705,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650726554.889, "dur": 39.525, "args": { "External id": 16706,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650726599.199, "dur": 13.987, "args": { "External id": 16707,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650726619.028, "dur": 3.741, "args": { "External id": 16708,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726620.988, "dur": 0.837, "args": { "External id": 16709,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650726626.816, "dur": 49.720, "args": { "External id": 16710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650726629.413, "dur": 4.817, "args": { "External id": 16711,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650726630.149, "dur": 3.549, "args": { "External id": 16712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726631.435, "dur": 2.050, "args": { "External id": 16713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650726635.000, "dur": 41.134, "args": { "External id": 16714,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650726635.947, "dur": 39.607, "args": { "External id": 16715,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650726680.637, "dur": 3.994, "args": { "External id": 16716,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726682.688, "dur": 0.866, "args": { "External id": 16717,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650726689.932, "dur": 1.633, "args": { "External id": 16718,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726700.276, "dur": 5.547, "args": { "External id": 16719,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726702.012, "dur": 3.556, "args": { "External id": 16720,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650726783.837, "dur": 168.897, "args": { "External id": 16721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726785.968, "dur": 2.057, "args": { "External id": 16722,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650726789.330, "dur": 162.911, "args": { "External id": 16723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650726790.441, "dur": 0.294, "args": { "External id": 16724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650726795.538, "dur": 18.845, "args": { "External id": 16725,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650726819.682, "dur": 3.119, "args": { "External id": 16726,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726821.657, "dur": 0.874, "args": { "External id": 16727,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650726823.484, "dur": 20.834, "args": { "External id": 16728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650726824.551, "dur": 2.802, "args": { "External id": 16729,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650726828.553, "dur": 15.535, "args": { "External id": 16730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650726830.709, "dur": 2.509, "args": { "External id": 16731,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650726845.741, "dur": 19.019, "args": { "External id": 16732,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650726865.991, "dur": 11.338, "args": { "External id": 16733,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650726879.838, "dur": 12.847, "args": { "External id": 16734,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650726896.376, "dur": 10.729, "args": { "External id": 16735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650726908.615, "dur": 17.916, "args": { "External id": 16736,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650726910.786, "dur": 1.238, "args": { "External id": 16737,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726913.695, "dur": 0.649, "args": { "External id": 16738,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650726927.842, "dur": 10.570, "args": { "External id": 16739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650726939.256, "dur": 10.530, "args": { "External id": 16740,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650726958.463, "dur": 1.428, "args": { "External id": 16741,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650726966.878, "dur": 3.296, "args": { "External id": 16742,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650726968.956, "dur": 0.529, "args": { "External id": 16743,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727075.702, "dur": 53.149, "args": { "External id": 16744,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727133.906, "dur": 5.972, "args": { "External id": 16745,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727136.934, "dur": 1.498, "args": { "External id": 16746,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650727141.212, "dur": 23.262, "args": { "External id": 16747,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650727169.197, "dur": 8.144, "args": { "External id": 16748,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650727172.372, "dur": 4.288, "args": { "External id": 16749,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727174.040, "dur": 2.379, "args": { "External id": 16750,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650727179.836, "dur": 38.301, "args": { "External id": 16751,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727181.013, "dur": 36.630, "args": { "External id": 16752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650727222.334, "dur": 30.505, "args": { "External id": 16753,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727260.367, "dur": 6.391, "args": { "External id": 16754,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727264.755, "dur": 0.982, "args": { "External id": 16755,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650727270.899, "dur": 50.531, "args": { "External id": 16756,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650727271.890, "dur": 3.783, "args": { "External id": 16757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650727272.637, "dur": 2.256, "args": { "External id": 16758,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727273.840, "dur": 0.904, "args": { "External id": 16759,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650727276.287, "dur": 44.749, "args": { "External id": 16760,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727277.017, "dur": 43.474, "args": { "External id": 16761,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727327.153, "dur": 3.673, "args": { "External id": 16762,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727329.118, "dur": 0.568, "args": { "External id": 16763,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650727336.715, "dur": 1.649, "args": { "External id": 16764,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727345.229, "dur": 6.501, "args": { "External id": 16765,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727346.766, "dur": 4.672, "args": { "External id": 16766,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650727432.643, "dur": 170.877, "args": { "External id": 16767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727434.874, "dur": 2.285, "args": { "External id": 16768,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650727440.040, "dur": 162.993, "args": { "External id": 16769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650727441.277, "dur": 0.411, "args": { "External id": 16770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650727442.674, "dur": 22.125, "args": { "External id": 16771,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650727466.223, "dur": 4.543, "args": { "External id": 16772,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727468.046, "dur": 2.435, "args": { "External id": 16773,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650727471.713, "dur": 22.501, "args": { "External id": 16774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727472.645, "dur": 1.861, "args": { "External id": 16775,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650727477.197, "dur": 16.774, "args": { "External id": 16776,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650727479.800, "dur": 2.431, "args": { "External id": 16777,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650727495.504, "dur": 18.913, "args": { "External id": 16778,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650727515.669, "dur": 12.847, "args": { "External id": 16779,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650727530.819, "dur": 12.334, "args": { "External id": 16780,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650727544.362, "dur": 11.230, "args": { "External id": 16781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650727557.068, "dur": 21.498, "args": { "External id": 16782,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650727558.910, "dur": 1.608, "args": { "External id": 16783,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727563.681, "dur": 2.473, "args": { "External id": 16784,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650727580.021, "dur": 10.096, "args": { "External id": 16785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650727591.264, "dur": 10.561, "args": { "External id": 16786,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650727609.677, "dur": 1.678, "args": { "External id": 16787,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727618.741, "dur": 2.942, "args": { "External id": 16788,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727620.551, "dur": 0.349, "args": { "External id": 16789,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727679.025, "dur": 46.321, "args": { "External id": 16790,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727729.401, "dur": 5.726, "args": { "External id": 16791,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727733.202, "dur": 0.958, "args": { "External id": 16792,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650727736.430, "dur": 22.707, "args": { "External id": 16793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650727763.334, "dur": 4.776, "args": { "External id": 16794,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650727764.602, "dur": 2.915, "args": { "External id": 16795,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727766.104, "dur": 1.160, "args": { "External id": 16796,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650727770.364, "dur": 38.204, "args": { "External id": 16797,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727771.490, "dur": 36.441, "args": { "External id": 16798,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650727813.516, "dur": 12.868, "args": { "External id": 16799,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727831.271, "dur": 3.220, "args": { "External id": 16800,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727833.052, "dur": 0.678, "args": { "External id": 16801,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650727837.848, "dur": 45.110, "args": { "External id": 16802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650727838.428, "dur": 4.355, "args": { "External id": 16803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650727839.140, "dur": 3.127, "args": { "External id": 16804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727841.539, "dur": 0.574, "args": { "External id": 16805,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650727843.334, "dur": 39.277, "args": { "External id": 16806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650727843.887, "dur": 38.250, "args": { "External id": 16807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650727886.446, "dur": 3.361, "args": { "External id": 16808,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650727888.189, "dur": 0.607, "args": { "External id": 16809,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650727894.622, "dur": 1.280, "args": { "External id": 16810,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727902.149, "dur": 6.610, "args": { "External id": 16811,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727904.823, "dur": 3.652, "args": { "External id": 16812,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650727980.040, "dur": 211.631, "args": { "External id": 16813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650727983.864, "dur": 40.534, "args": { "External id": 16814,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650728027.152, "dur": 163.905, "args": { "External id": 16815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650728028.585, "dur": 0.348, "args": { "External id": 16816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650728029.762, "dur": 22.111, "args": { "External id": 16817,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650728053.305, "dur": 4.599, "args": { "External id": 16818,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728056.700, "dur": 0.909, "args": { "External id": 16819,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650728058.587, "dur": 21.818, "args": { "External id": 16820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650728059.758, "dur": 1.740, "args": { "External id": 16821,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650728064.326, "dur": 15.746, "args": { "External id": 16822,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650728066.650, "dur": 2.600, "args": { "External id": 16823,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650728081.721, "dur": 20.480, "args": { "External id": 16824,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650728103.264, "dur": 11.379, "args": { "External id": 16825,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650728117.046, "dur": 13.724, "args": { "External id": 16826,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650728132.212, "dur": 10.907, "args": { "External id": 16827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650728144.790, "dur": 22.026, "args": { "External id": 16828,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650728148.328, "dur": 1.404, "args": { "External id": 16829,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728153.646, "dur": 0.685, "args": { "External id": 16830,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650728168.097, "dur": 10.858, "args": { "External id": 16831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650728180.042, "dur": 10.103, "args": { "External id": 16832,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650728198.791, "dur": 2.201, "args": { "External id": 16833,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728208.861, "dur": 3.665, "args": { "External id": 16834,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728211.320, "dur": 0.431, "args": { "External id": 16835,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650728292.285, "dur": 53.131, "args": { "External id": 16836,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728350.556, "dur": 6.920, "args": { "External id": 16837,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728355.051, "dur": 1.051, "args": { "External id": 16838,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650728358.751, "dur": 23.063, "args": { "External id": 16839,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650728386.248, "dur": 5.559, "args": { "External id": 16840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650728387.525, "dur": 3.605, "args": { "External id": 16841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728389.515, "dur": 1.374, "args": { "External id": 16842,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650728394.509, "dur": 41.188, "args": { "External id": 16843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650728397.645, "dur": 37.511, "args": { "External id": 16844,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650728439.291, "dur": 13.891, "args": { "External id": 16845,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728458.297, "dur": 3.133, "args": { "External id": 16846,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728460.063, "dur": 0.656, "args": { "External id": 16847,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336759, "tid": 1336759, "ts": 1295650728465.249, "dur": 46.467, "args": { "External id": 16848,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650728466.202, "dur": 5.174, "args": { "External id": 16849,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650728466.999, "dur": 3.858, "args": { "External id": 16850,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728470.099, "dur": 0.603, "args": { "External id": 16851,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650728472.016, "dur": 39.256, "args": { "External id": 16852,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650728472.632, "dur": 38.087, "args": { "External id": 16853,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728514.937, "dur": 3.753, "args": { "External id": 16854,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728516.830, "dur": 0.844, "args": { "External id": 16855,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650728524.475, "dur": 1.535, "args": { "External id": 16856,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336759, "tid": 1336759, "ts": 1295650728534.450, "dur": 5.747, "args": { "External id": 16857,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650728536.107, "dur": 3.806, "args": { "External id": 16858,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650728613.265, "dur": 165.687, "args": { "External id": 16859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650728616.591, "dur": 1.947, "args": { "External id": 16860,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336759, "tid": 1336759, "ts": 1295650728619.655, "dur": 158.829, "args": { "External id": 16861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336759, "tid": 1336759, "ts": 1295650728620.815, "dur": 0.313, "args": { "External id": 16862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336759, "tid": 1336759, "ts": 1295650728623.609, "dur": 19.198, "args": { "External id": 16863,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336759, "tid": 1336759, "ts": 1295650728644.275, "dur": 5.104, "args": { "External id": 16864,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728647.945, "dur": 1.222, "args": { "External id": 16865,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650728650.139, "dur": 18.579, "args": { "External id": 16866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295650728650.862, "dur": 1.443, "args": { "External id": 16867,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295650728653.437, "dur": 14.989, "args": { "External id": 16868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650728656.048, "dur": 2.410, "args": { "External id": 16869,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295650728669.977, "dur": 18.825, "args": { "External id": 16870,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650728689.869, "dur": 13.915, "args": { "External id": 16871,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336759, "tid": 1336759, "ts": 1295650728706.355, "dur": 12.285, "args": { "External id": 16872,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336759, "tid": 1336759, "ts": 1295650728721.390, "dur": 11.570, "args": { "External id": 16873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650728734.382, "dur": 18.969, "args": { "External id": 16874,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295650728736.216, "dur": 1.475, "args": { "External id": 16875,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728739.348, "dur": 1.996, "args": { "External id": 16876,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336759, "tid": 1336759, "ts": 1295650728754.803, "dur": 10.808, "args": { "External id": 16877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650728766.377, "dur": 10.889, "args": { "External id": 16878,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295650728786.179, "dur": 1.462, "args": { "External id": 16879,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728794.479, "dur": 3.029, "args": { "External id": 16880,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728796.369, "dur": 0.454, "args": { "External id": 16881,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650728854.259, "dur": 45.173, "args": { "External id": 16882,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336759, "tid": 1336759, "ts": 1295650728903.599, "dur": 4.402, "args": { "External id": 16883,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728906.000, "dur": 1.012, "args": { "External id": 16884,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650728909.066, "dur": 20.568, "args": { "External id": 16885,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336759, "tid": 1336759, "ts": 1295650728933.978, "dur": 6.611, "args": { "External id": 16886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336759, "tid": 1336759, "ts": 1295650728935.114, "dur": 4.954, "args": { "External id": 16887,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650728938.630, "dur": 1.266, "args": { "External id": 16888,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336759, "tid": 1336759, "ts": 1295650728942.525, "dur": 37.585, "args": { "External id": 16889,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336759, "tid": 1336759, "ts": 1295650728943.543, "dur": 36.071, "args": { "External id": 16890,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650728983.334, "dur": 56.602, "args": { "External id": 16891,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650729046.744, "dur": 27.830, "args": { "External id": 16892,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336759, "tid": 1336759, "ts": 1295650729049.158, "dur": 25.017, "args": { "External id": 16893,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650729054.553, "dur": 2.406, "args": { "External id": 16894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295650729079.911, "dur": 65.753, "args": { "External id": 16895,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336759, "tid": 1336759, "ts": 1295650729081.597, "dur": 63.792, "args": { "External id": 16896,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 10391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650729124.368, "dur": 5.466, "args": { "External id": 16897,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295650729131.199, "dur": 13.650, "args": { "External id": 16898,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650729157.820, "dur": 5.161, "args": { "External id": 16899,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650729159.889, "dur": 2.768, "args": { "External id": 16900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336759, "tid": 1336759, "ts": 1295650729164.098, "dur": 0.988, "args": { "External id": 16901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10396 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336759, "tid": 1336759, "ts": 1295650729164.397, "dur": 0.411, "args": { "External id": 16902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650729204.948, "dur": 21.757, "args": { "External id": 16903,"Sequence number": 246768, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336759, "tid": 1336759, "ts": 1295650729244.289, "dur": 17.072, "args": { "External id": 16904,"Sequence number": 246769, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10399 } }, { "ph": "s", "id": 2, "pid": 1336759, "tid": 1336759, "ts": 1295650729244.289, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward", "pid": 1336759, "tid": 1336759, "ts": 1295650729366.475, "dur": 39.097, "args": { "External id": 16905,"Record function id": 0, "Ev Idx": 10400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336759, "tid": 1336759, "ts": 1295650729504.785, "dur": 34.939, "args": { "External id": 16906,"Sequence number": 246770, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10401 } }, { "ph": "s", "id": 1, "pid": 1336759, "tid": 1336759, "ts": 1295650729504.785, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::ones_like", "pid": 1336759, "tid": 1336759, "ts": 1295650729594.580, "dur": 25.974, "args": { "External id": 16907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295650729596.140, "dur": 8.610, "args": { "External id": 16908,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336759, "tid": 1336759, "ts": 1295650729599.705, "dur": 4.462, "args": { "External id": 16909,"Record function id": 0, "Concrete Inputs": ["[1]", "[1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295650729606.245, "dur": 14.033, "args": { "External id": 16910,"Record function id": 0, "Concrete Inputs": ["", "1."], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336759, "tid": 1336759, "ts": 1295652033055.480, "dur": 66.055, "args": { "External id": 16911,"Sequence number": 246771, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336759, "tid": 1336759, "ts": 1295652033131.928, "dur": 19.227, "args": { "External id": 16912,"Sequence number": 246772, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295652033157.995, "dur": 19.683, "args": { "External id": 16913,"Sequence number": 246773, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295652033624.655, "dur": 28.281, "args": { "External id": 16914,"Sequence number": 246774, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295652034036.142, "dur": 32.800, "args": { "External id": 16915,"Sequence number": 246775, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336759, "tid": 1336759, "ts": 1295652035299.355, "dur": 2892.699, "args": { "External id": 16916,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336759, "tid": 1336759, "ts": 1295652035819.896, "dur": 894.545, "args": { "External id": 16917,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336759, "tid": 1336759, "ts": 1295652035839.578, "dur": 62.061, "args": { "External id": 16918,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295652035842.711, "dur": 14.373, "args": { "External id": 16919,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336759, "tid": 1336759, "ts": 1295652035859.570, "dur": 41.777, "args": { "External id": 16920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[36375]], "Ev Idx": 10415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336759, "tid": 1336759, "ts": 1295652035862.261, "dur": 38.415, "args": { "External id": 16921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[36375], []], "Ev Idx": 10416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038226.900, "dur": 15.599, "args": { "External id": 16922,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038246.707, "dur": 0.408, "args": { "External id": 16923,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038248.522, "dur": 0.460, "args": { "External id": 16924,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038250.093, "dur": 0.346, "args": { "External id": 16925,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038251.518, "dur": 0.262, "args": { "External id": 16926,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038252.962, "dur": 0.443, "args": { "External id": 16927,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038254.835, "dur": 0.451, "args": { "External id": 16928,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038258.175, "dur": 0.336, "args": { "External id": 16929,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038259.531, "dur": 0.208, "args": { "External id": 16930,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038260.655, "dur": 0.353, "args": { "External id": 16931,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038261.827, "dur": 0.201, "args": { "External id": 16932,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038262.920, "dur": 0.219, "args": { "External id": 16933,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038264.048, "dur": 0.203, "args": { "External id": 16934,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038265.068, "dur": 0.199, "args": { "External id": 16935,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038266.141, "dur": 0.196, "args": { "External id": 16936,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038269.035, "dur": 0.236, "args": { "External id": 16937,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038270.102, "dur": 0.196, "args": { "External id": 16938,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038271.218, "dur": 0.206, "args": { "External id": 16939,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038272.202, "dur": 0.199, "args": { "External id": 16940,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038273.251, "dur": 0.215, "args": { "External id": 16941,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038274.257, "dur": 0.198, "args": { "External id": 16942,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038275.246, "dur": 0.203, "args": { "External id": 16943,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038276.722, "dur": 0.200, "args": { "External id": 16944,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038279.074, "dur": 0.208, "args": { "External id": 16945,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038280.228, "dur": 0.262, "args": { "External id": 16946,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038281.457, "dur": 0.341, "args": { "External id": 16947,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038282.544, "dur": 0.298, "args": { "External id": 16948,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038283.717, "dur": 0.353, "args": { "External id": 16949,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038285.014, "dur": 0.215, "args": { "External id": 16950,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038285.977, "dur": 0.213, "args": { "External id": 16951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038286.927, "dur": 0.366, "args": { "External id": 16952,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038289.613, "dur": 0.322, "args": { "External id": 16953,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038290.732, "dur": 0.198, "args": { "External id": 16954,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038292.108, "dur": 0.218, "args": { "External id": 16955,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038293.075, "dur": 0.199, "args": { "External id": 16956,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038294.021, "dur": 0.202, "args": { "External id": 16957,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038294.966, "dur": 0.198, "args": { "External id": 16958,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038295.903, "dur": 0.212, "args": { "External id": 16959,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038296.863, "dur": 0.199, "args": { "External id": 16960,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038299.308, "dur": 0.202, "args": { "External id": 16961,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038300.363, "dur": 0.213, "args": { "External id": 16962,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038301.537, "dur": 0.220, "args": { "External id": 16963,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038302.523, "dur": 0.214, "args": { "External id": 16964,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038303.602, "dur": 0.202, "args": { "External id": 16965,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038304.633, "dur": 0.198, "args": { "External id": 16966,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038306.711, "dur": 0.230, "args": { "External id": 16967,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038307.995, "dur": 0.215, "args": { "External id": 16968,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038310.657, "dur": 0.201, "args": { "External id": 16969,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038311.995, "dur": 0.196, "args": { "External id": 16970,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038313.015, "dur": 0.202, "args": { "External id": 16971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038314.040, "dur": 0.215, "args": { "External id": 16972,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038315.162, "dur": 0.201, "args": { "External id": 16973,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038316.137, "dur": 0.196, "args": { "External id": 16974,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038317.296, "dur": 0.243, "args": { "External id": 16975,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038318.326, "dur": 0.333, "args": { "External id": 16976,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038321.393, "dur": 0.319, "args": { "External id": 16977,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038322.485, "dur": 0.299, "args": { "External id": 16978,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038323.642, "dur": 0.357, "args": { "External id": 16979,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038324.751, "dur": 0.325, "args": { "External id": 16980,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038326.026, "dur": 0.345, "args": { "External id": 16981,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038327.123, "dur": 0.197, "args": { "External id": 16982,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038328.206, "dur": 0.465, "args": { "External id": 16983,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038329.528, "dur": 0.348, "args": { "External id": 16984,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038332.705, "dur": 0.172, "args": { "External id": 16985,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038333.621, "dur": 0.189, "args": { "External id": 16986,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038334.716, "dur": 0.207, "args": { "External id": 16987,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038335.719, "dur": 0.194, "args": { "External id": 16988,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038336.682, "dur": 0.201, "args": { "External id": 16989,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038337.637, "dur": 0.196, "args": { "External id": 16990,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038338.584, "dur": 0.210, "args": { "External id": 16991,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038339.597, "dur": 0.193, "args": { "External id": 16992,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038342.116, "dur": 0.212, "args": { "External id": 16993,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038343.157, "dur": 0.193, "args": { "External id": 16994,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038344.110, "dur": 0.209, "args": { "External id": 16995,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038345.077, "dur": 0.208, "args": { "External id": 16996,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038346.063, "dur": 0.200, "args": { "External id": 16997,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038347.009, "dur": 0.196, "args": { "External id": 16998,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038348.657, "dur": 0.198, "args": { "External id": 16999,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038349.709, "dur": 0.228, "args": { "External id": 17000,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038352.274, "dur": 0.199, "args": { "External id": 17001,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038353.320, "dur": 0.193, "args": { "External id": 17002,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038354.354, "dur": 0.213, "args": { "External id": 17003,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038355.419, "dur": 0.194, "args": { "External id": 17004,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038356.360, "dur": 0.197, "args": { "External id": 17005,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038357.306, "dur": 0.193, "args": { "External id": 17006,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038358.237, "dur": 0.198, "args": { "External id": 17007,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038359.193, "dur": 0.192, "args": { "External id": 17008,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038362.042, "dur": 0.214, "args": { "External id": 17009,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038363.067, "dur": 0.194, "args": { "External id": 17010,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038364.178, "dur": 0.199, "args": { "External id": 17011,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038365.233, "dur": 0.194, "args": { "External id": 17012,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038366.373, "dur": 0.200, "args": { "External id": 17013,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038367.328, "dur": 0.194, "args": { "External id": 17014,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038368.796, "dur": 0.199, "args": { "External id": 17015,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038369.749, "dur": 0.193, "args": { "External id": 17016,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038372.350, "dur": 0.201, "args": { "External id": 17017,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038373.359, "dur": 0.193, "args": { "External id": 17018,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038374.280, "dur": 0.210, "args": { "External id": 17019,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038375.234, "dur": 0.307, "args": { "External id": 17020,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038376.272, "dur": 0.311, "args": { "External id": 17021,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038377.361, "dur": 0.364, "args": { "External id": 17022,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038378.454, "dur": 0.199, "args": { "External id": 17023,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038379.392, "dur": 0.316, "args": { "External id": 17024,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038382.151, "dur": 0.297, "args": { "External id": 17025,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038383.201, "dur": 0.322, "args": { "External id": 17026,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038384.287, "dur": 0.327, "args": { "External id": 17027,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038385.352, "dur": 0.311, "args": { "External id": 17028,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038386.460, "dur": 0.333, "args": { "External id": 17029,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038387.546, "dur": 0.331, "args": { "External id": 17030,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038388.918, "dur": 0.212, "args": { "External id": 17031,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038389.973, "dur": 0.197, "args": { "External id": 17032,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038392.496, "dur": 0.200, "args": { "External id": 17033,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038393.470, "dur": 0.196, "args": { "External id": 17034,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038394.403, "dur": 0.224, "args": { "External id": 17035,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038395.378, "dur": 0.196, "args": { "External id": 17036,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038396.371, "dur": 0.220, "args": { "External id": 17037,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038397.417, "dur": 0.198, "args": { "External id": 17038,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038398.348, "dur": 0.219, "args": { "External id": 17039,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038399.557, "dur": 0.194, "args": { "External id": 17040,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038401.911, "dur": 0.199, "args": { "External id": 17041,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038402.923, "dur": 0.203, "args": { "External id": 17042,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038403.951, "dur": 0.214, "args": { "External id": 17043,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038404.932, "dur": 0.194, "args": { "External id": 17044,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038405.991, "dur": 0.228, "args": { "External id": 17045,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038406.965, "dur": 0.193, "args": { "External id": 17046,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038407.894, "dur": 0.198, "args": { "External id": 17047,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038408.979, "dur": 0.193, "args": { "External id": 17048,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038411.380, "dur": 0.334, "args": { "External id": 17049,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038412.566, "dur": 0.197, "args": { "External id": 17050,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038413.865, "dur": 0.351, "args": { "External id": 17051,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038415.076, "dur": 0.209, "args": { "External id": 17052,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038416.150, "dur": 0.232, "args": { "External id": 17053,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038417.205, "dur": 0.340, "args": { "External id": 17054,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038418.353, "dur": 0.199, "args": { "External id": 17055,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038419.423, "dur": 0.203, "args": { "External id": 17056,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038421.985, "dur": 0.336, "args": { "External id": 17057,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038423.310, "dur": 0.289, "args": { "External id": 17058,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038424.370, "dur": 0.351, "args": { "External id": 17059,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038425.473, "dur": 0.203, "args": { "External id": 17060,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038426.422, "dur": 0.227, "args": { "External id": 17061,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038427.403, "dur": 0.195, "args": { "External id": 17062,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038428.341, "dur": 0.218, "args": { "External id": 17063,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038429.313, "dur": 0.193, "args": { "External id": 17064,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038431.496, "dur": 0.199, "args": { "External id": 17065,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038432.492, "dur": 0.193, "args": { "External id": 17066,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038433.432, "dur": 0.197, "args": { "External id": 17067,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038434.419, "dur": 0.193, "args": { "External id": 17068,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038435.356, "dur": 0.198, "args": { "External id": 17069,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038436.344, "dur": 0.206, "args": { "External id": 17070,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038437.706, "dur": 0.197, "args": { "External id": 17071,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038438.665, "dur": 0.193, "args": { "External id": 17072,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038441.322, "dur": 0.201, "args": { "External id": 17073,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038442.299, "dur": 0.193, "args": { "External id": 17074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038443.268, "dur": 0.198, "args": { "External id": 17075,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038444.207, "dur": 0.197, "args": { "External id": 17076,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038445.236, "dur": 0.197, "args": { "External id": 17077,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038446.247, "dur": 0.203, "args": { "External id": 17078,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038447.187, "dur": 0.197, "args": { "External id": 17079,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038448.138, "dur": 0.223, "args": { "External id": 17080,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038451.659, "dur": 0.210, "args": { "External id": 17081,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038452.716, "dur": 0.198, "args": { "External id": 17082,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038453.715, "dur": 0.207, "args": { "External id": 17083,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038454.667, "dur": 0.194, "args": { "External id": 17084,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038455.671, "dur": 0.207, "args": { "External id": 17085,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038456.696, "dur": 0.204, "args": { "External id": 17086,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038457.681, "dur": 0.200, "args": { "External id": 17087,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038458.687, "dur": 0.200, "args": { "External id": 17088,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038461.579, "dur": 0.197, "args": { "External id": 17089,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038462.620, "dur": 0.196, "args": { "External id": 17090,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038463.618, "dur": 0.223, "args": { "External id": 17091,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038464.620, "dur": 0.193, "args": { "External id": 17092,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038465.626, "dur": 0.204, "args": { "External id": 17093,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038466.682, "dur": 0.211, "args": { "External id": 17094,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038467.876, "dur": 0.199, "args": { "External id": 17095,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038468.980, "dur": 0.193, "args": { "External id": 17096,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038471.614, "dur": 0.199, "args": { "External id": 17097,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038472.665, "dur": 0.193, "args": { "External id": 17098,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038473.699, "dur": 0.197, "args": { "External id": 17099,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038474.785, "dur": 0.192, "args": { "External id": 17100,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038475.833, "dur": 0.200, "args": { "External id": 17101,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038476.874, "dur": 0.234, "args": { "External id": 17102,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038477.848, "dur": 0.198, "args": { "External id": 17103,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038478.801, "dur": 0.214, "args": { "External id": 17104,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038481.732, "dur": 0.201, "args": { "External id": 17105,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038482.682, "dur": 0.354, "args": { "External id": 17106,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038483.767, "dur": 0.353, "args": { "External id": 17107,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038484.862, "dur": 0.305, "args": { "External id": 17108,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038485.905, "dur": 0.315, "args": { "External id": 17109,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038487.006, "dur": 0.327, "args": { "External id": 17110,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038488.066, "dur": 0.196, "args": { "External id": 17111,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038489.025, "dur": 0.193, "args": { "External id": 17112,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038491.770, "dur": 0.219, "args": { "External id": 17113,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038492.732, "dur": 0.197, "args": { "External id": 17114,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038493.661, "dur": 0.199, "args": { "External id": 17115,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038494.602, "dur": 0.193, "args": { "External id": 17116,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038495.570, "dur": 0.199, "args": { "External id": 17117,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038496.511, "dur": 0.193, "args": { "External id": 17118,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038497.457, "dur": 0.199, "args": { "External id": 17119,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038498.401, "dur": 0.193, "args": { "External id": 17120,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038500.793, "dur": 0.198, "args": { "External id": 17121,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038501.742, "dur": 0.193, "args": { "External id": 17122,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038503.108, "dur": 0.297, "args": { "External id": 17123,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038504.192, "dur": 0.320, "args": { "External id": 17124,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038505.248, "dur": 0.301, "args": { "External id": 17125,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038506.304, "dur": 0.287, "args": { "External id": 17126,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038507.326, "dur": 0.199, "args": { "External id": 17127,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038508.278, "dur": 0.193, "args": { "External id": 17128,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038510.857, "dur": 0.201, "args": { "External id": 17129,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038511.801, "dur": 0.205, "args": { "External id": 17130,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038512.737, "dur": 0.199, "args": { "External id": 17131,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038513.691, "dur": 0.193, "args": { "External id": 17132,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038514.625, "dur": 0.199, "args": { "External id": 17133,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038515.562, "dur": 0.194, "args": { "External id": 17134,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038516.527, "dur": 0.199, "args": { "External id": 17135,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038517.575, "dur": 0.193, "args": { "External id": 17136,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038520.742, "dur": 0.198, "args": { "External id": 17137,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038521.777, "dur": 0.205, "args": { "External id": 17138,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038522.785, "dur": 0.199, "args": { "External id": 17139,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038523.732, "dur": 0.194, "args": { "External id": 17140,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038524.754, "dur": 0.199, "args": { "External id": 17141,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038525.860, "dur": 0.198, "args": { "External id": 17142,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038526.795, "dur": 0.197, "args": { "External id": 17143,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038527.806, "dur": 0.200, "args": { "External id": 17144,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038530.372, "dur": 0.210, "args": { "External id": 17145,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038531.339, "dur": 0.193, "args": { "External id": 17146,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038532.347, "dur": 0.213, "args": { "External id": 17147,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038533.355, "dur": 0.193, "args": { "External id": 17148,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038534.283, "dur": 0.199, "args": { "External id": 17149,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038535.236, "dur": 0.194, "args": { "External id": 17150,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038536.271, "dur": 0.197, "args": { "External id": 17151,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038537.220, "dur": 0.193, "args": { "External id": 17152,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038539.896, "dur": 0.199, "args": { "External id": 17153,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038540.844, "dur": 0.192, "args": { "External id": 17154,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038542.199, "dur": 0.197, "args": { "External id": 17155,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038543.146, "dur": 0.194, "args": { "External id": 17156,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038544.077, "dur": 0.199, "args": { "External id": 17157,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038545.052, "dur": 0.194, "args": { "External id": 17158,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038545.980, "dur": 0.198, "args": { "External id": 17159,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038546.924, "dur": 0.196, "args": { "External id": 17160,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038549.633, "dur": 0.199, "args": { "External id": 17161,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038550.615, "dur": 0.194, "args": { "External id": 17162,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038551.565, "dur": 0.381, "args": { "External id": 17163,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038552.697, "dur": 0.303, "args": { "External id": 17164,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038553.773, "dur": 0.352, "args": { "External id": 17165,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038554.875, "dur": 0.287, "args": { "External id": 17166,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038555.899, "dur": 0.198, "args": { "External id": 17167,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038556.857, "dur": 0.334, "args": { "External id": 17168,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038559.148, "dur": 0.305, "args": { "External id": 17169,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038560.201, "dur": 0.327, "args": { "External id": 17170,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038561.314, "dur": 0.339, "args": { "External id": 17171,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038562.435, "dur": 0.416, "args": { "External id": 17172,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038563.588, "dur": 0.346, "args": { "External id": 17173,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038564.720, "dur": 0.193, "args": { "External id": 17174,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038565.760, "dur": 0.198, "args": { "External id": 17175,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038566.786, "dur": 0.194, "args": { "External id": 17176,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038569.524, "dur": 0.202, "args": { "External id": 17177,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038573.334, "dur": 0.198, "args": { "External id": 17178,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038574.635, "dur": 0.198, "args": { "External id": 17179,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038575.666, "dur": 0.193, "args": { "External id": 17180,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038576.737, "dur": 0.198, "args": { "External id": 17181,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038577.833, "dur": 0.193, "args": { "External id": 17182,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038578.900, "dur": 0.197, "args": { "External id": 17183,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038579.997, "dur": 0.197, "args": { "External id": 17184,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038582.518, "dur": 0.202, "args": { "External id": 17185,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038583.719, "dur": 0.196, "args": { "External id": 17186,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038584.680, "dur": 0.200, "args": { "External id": 17187,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038585.627, "dur": 0.196, "args": { "External id": 17188,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038586.786, "dur": 0.207, "args": { "External id": 17189,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038587.862, "dur": 0.198, "args": { "External id": 17190,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038589.103, "dur": 0.198, "args": { "External id": 17191,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038590.066, "dur": 0.194, "args": { "External id": 17192,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038592.526, "dur": 0.199, "args": { "External id": 17193,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038593.579, "dur": 0.196, "args": { "External id": 17194,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038596.184, "dur": 0.489, "args": { "External id": 17195,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038597.453, "dur": 0.315, "args": { "External id": 17196,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038598.606, "dur": 0.490, "args": { "External id": 17197,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038599.918, "dur": 0.321, "args": { "External id": 17198,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038600.992, "dur": 0.199, "args": { "External id": 17199,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038601.955, "dur": 0.293, "args": { "External id": 17200,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038604.372, "dur": 0.333, "args": { "External id": 17201,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038605.479, "dur": 0.324, "args": { "External id": 17202,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038606.537, "dur": 0.201, "args": { "External id": 17203,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038607.516, "dur": 0.193, "args": { "External id": 17204,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038608.444, "dur": 0.197, "args": { "External id": 17205,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038609.381, "dur": 0.195, "args": { "External id": 17206,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038610.336, "dur": 0.235, "args": { "External id": 17207,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038611.319, "dur": 0.212, "args": { "External id": 17208,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038614.025, "dur": 0.199, "args": { "External id": 17209,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038614.976, "dur": 0.192, "args": { "External id": 17210,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038615.915, "dur": 0.200, "args": { "External id": 17211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652038616.857, "dur": 0.194, "args": { "External id": 17212,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336759, "tid": 1336759, "ts": 1295652038671.768, "dur": 1450.782, "args": { "External id": 17213,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336759, "tid": 1336759, "ts": 1295652039123.227, "dur": 925.950, "args": { "External id": 17214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039131.811, "dur": 7.085, "args": { "External id": 17215,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039135.387, "dur": 2.944, "args": { "External id": 17216,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039139.436, "dur": 3.394, "args": { "External id": 17217,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039140.197, "dur": 2.501, "args": { "External id": 17218,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039143.315, "dur": 3.078, "args": { "External id": 17219,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039145.393, "dur": 0.910, "args": { "External id": 17220,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039146.784, "dur": 1.292, "args": { "External id": 17221,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039147.212, "dur": 0.794, "args": { "External id": 17222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039149.763, "dur": 4.086, "args": { "External id": 17223,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039152.984, "dur": 0.800, "args": { "External id": 17224,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039154.264, "dur": 1.424, "args": { "External id": 17225,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039154.893, "dur": 0.726, "args": { "External id": 17226,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039156.040, "dur": 1.501, "args": { "External id": 17227,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039156.637, "dur": 0.837, "args": { "External id": 17228,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039158.105, "dur": 3.830, "args": { "External id": 17229,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039160.841, "dur": 1.023, "args": { "External id": 17230,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039162.207, "dur": 1.500, "args": { "External id": 17231,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039162.894, "dur": 0.746, "args": { "External id": 17232,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039164.133, "dur": 2.854, "args": { "External id": 17233,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039164.801, "dur": 1.939, "args": { "External id": 17234,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039167.401, "dur": 2.405, "args": { "External id": 17235,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039169.217, "dur": 0.528, "args": { "External id": 17236,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039170.168, "dur": 1.446, "args": { "External id": 17237,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039170.797, "dur": 0.730, "args": { "External id": 17238,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039173.119, "dur": 4.121, "args": { "External id": 17239,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039176.312, "dur": 0.855, "args": { "External id": 17240,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039177.508, "dur": 1.108, "args": { "External id": 17241,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039177.876, "dur": 0.676, "args": { "External id": 17242,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039178.861, "dur": 1.494, "args": { "External id": 17243,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039179.220, "dur": 1.071, "args": { "External id": 17244,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039180.580, "dur": 2.965, "args": { "External id": 17245,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039182.661, "dur": 0.815, "args": { "External id": 17246,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039183.903, "dur": 1.068, "args": { "External id": 17247,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039184.271, "dur": 0.628, "args": { "External id": 17248,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039185.293, "dur": 2.825, "args": { "External id": 17249,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039185.804, "dur": 2.243, "args": { "External id": 17250,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039188.643, "dur": 2.497, "args": { "External id": 17251,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039190.324, "dur": 0.747, "args": { "External id": 17252,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039191.476, "dur": 1.487, "args": { "External id": 17253,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039192.004, "dur": 0.892, "args": { "External id": 17254,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039195.009, "dur": 4.688, "args": { "External id": 17255,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039198.932, "dur": 0.680, "args": { "External id": 17256,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039200.201, "dur": 1.158, "args": { "External id": 17257,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039200.685, "dur": 0.612, "args": { "External id": 17258,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039201.710, "dur": 1.546, "args": { "External id": 17259,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039202.211, "dur": 0.977, "args": { "External id": 17260,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039203.479, "dur": 3.574, "args": { "External id": 17261,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039206.090, "dur": 0.894, "args": { "External id": 17262,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039207.496, "dur": 1.035, "args": { "External id": 17263,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039207.898, "dur": 0.565, "args": { "External id": 17264,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039208.859, "dur": 1.966, "args": { "External id": 17265,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039209.230, "dur": 1.524, "args": { "External id": 17266,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039211.188, "dur": 2.844, "args": { "External id": 17267,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039213.162, "dur": 0.801, "args": { "External id": 17268,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039214.511, "dur": 1.388, "args": { "External id": 17269,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039214.989, "dur": 0.847, "args": { "External id": 17270,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039217.530, "dur": 4.166, "args": { "External id": 17271,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039220.758, "dur": 0.866, "args": { "External id": 17272,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039221.940, "dur": 1.374, "args": { "External id": 17273,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039222.468, "dur": 0.768, "args": { "External id": 17274,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039223.541, "dur": 1.026, "args": { "External id": 17275,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039223.895, "dur": 0.605, "args": { "External id": 17276,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039224.913, "dur": 2.934, "args": { "External id": 17277,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039227.004, "dur": 0.775, "args": { "External id": 17278,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039228.073, "dur": 15.707, "args": { "External id": 17279,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039242.957, "dur": 0.559, "args": { "External id": 17280,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039244.196, "dur": 2.454, "args": { "External id": 17281,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039244.596, "dur": 1.972, "args": { "External id": 17282,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039247.027, "dur": 4.225, "args": { "External id": 17283,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039250.523, "dur": 0.647, "args": { "External id": 17284,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039251.827, "dur": 2.566, "args": { "External id": 17285,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039252.375, "dur": 1.946, "args": { "External id": 17286,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039256.069, "dur": 2.417, "args": { "External id": 17287,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039257.802, "dur": 0.606, "args": { "External id": 17288,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039258.716, "dur": 1.133, "args": { "External id": 17289,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039259.082, "dur": 0.688, "args": { "External id": 17290,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039260.214, "dur": 3.030, "args": { "External id": 17291,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039262.586, "dur": 0.588, "args": { "External id": 17292,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039263.491, "dur": 2.430, "args": { "External id": 17293,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039265.319, "dur": 0.524, "args": { "External id": 17294,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039266.146, "dur": 1.560, "args": { "External id": 17295,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039266.692, "dur": 0.945, "args": { "External id": 17296,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039267.935, "dur": 2.706, "args": { "External id": 17297,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039269.867, "dur": 0.704, "args": { "External id": 17298,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039270.998, "dur": 1.244, "args": { "External id": 17299,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039271.511, "dur": 0.659, "args": { "External id": 17300,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039272.581, "dur": 2.364, "args": { "External id": 17301,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039272.968, "dur": 1.906, "args": { "External id": 17302,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039276.556, "dur": 1.705, "args": { "External id": 17303,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039277.452, "dur": 0.739, "args": { "External id": 17304,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039278.643, "dur": 1.245, "args": { "External id": 17305,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039279.030, "dur": 0.793, "args": { "External id": 17306,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039280.249, "dur": 2.678, "args": { "External id": 17307,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039282.334, "dur": 0.520, "args": { "External id": 17308,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039283.306, "dur": 1.772, "args": { "External id": 17309,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039284.413, "dur": 0.594, "args": { "External id": 17310,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039285.373, "dur": 1.546, "args": { "External id": 17311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039286.070, "dur": 0.778, "args": { "External id": 17312,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039287.247, "dur": 2.928, "args": { "External id": 17313,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039289.400, "dur": 0.707, "args": { "External id": 17314,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039290.640, "dur": 1.501, "args": { "External id": 17315,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039291.586, "dur": 0.487, "args": { "External id": 17316,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039292.365, "dur": 2.634, "args": { "External id": 17317,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039292.963, "dur": 1.967, "args": { "External id": 17318,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039296.660, "dur": 1.516, "args": { "External id": 17319,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039297.256, "dur": 0.855, "args": { "External id": 17320,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039298.614, "dur": 0.962, "args": { "External id": 17321,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039298.983, "dur": 0.528, "args": { "External id": 17322,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039299.804, "dur": 2.796, "args": { "External id": 17323,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039301.911, "dur": 0.623, "args": { "External id": 17324,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039302.846, "dur": 1.644, "args": { "External id": 17325,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039303.783, "dur": 0.636, "args": { "External id": 17326,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039304.892, "dur": 1.772, "args": { "External id": 17327,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039305.414, "dur": 1.182, "args": { "External id": 17328,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039306.992, "dur": 3.239, "args": { "External id": 17329,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039309.312, "dur": 0.853, "args": { "External id": 17330,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039310.555, "dur": 2.502, "args": { "External id": 17331,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039311.984, "dur": 1.004, "args": { "External id": 17332,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039313.472, "dur": 2.429, "args": { "External id": 17333,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039314.078, "dur": 1.752, "args": { "External id": 17334,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039317.713, "dur": 1.566, "args": { "External id": 17335,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039318.620, "dur": 0.593, "args": { "External id": 17336,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039319.507, "dur": 1.284, "args": { "External id": 17337,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039320.052, "dur": 0.673, "args": { "External id": 17338,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039321.322, "dur": 2.860, "args": { "External id": 17339,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039323.599, "dur": 0.517, "args": { "External id": 17340,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039324.549, "dur": 1.875, "args": { "External id": 17341,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039325.790, "dur": 0.566, "args": { "External id": 17342,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039326.781, "dur": 1.857, "args": { "External id": 17343,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039327.503, "dur": 1.068, "args": { "External id": 17344,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039328.867, "dur": 2.550, "args": { "External id": 17345,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039330.650, "dur": 0.704, "args": { "External id": 17346,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039331.643, "dur": 1.621, "args": { "External id": 17347,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039332.318, "dur": 0.886, "args": { "External id": 17348,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039333.492, "dur": 2.592, "args": { "External id": 17349,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039334.054, "dur": 1.962, "args": { "External id": 17350,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039337.976, "dur": 1.815, "args": { "External id": 17351,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039338.818, "dur": 0.909, "args": { "External id": 17352,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039340.151, "dur": 1.099, "args": { "External id": 17353,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039340.528, "dur": 0.659, "args": { "External id": 17354,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039341.610, "dur": 2.798, "args": { "External id": 17355,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039343.729, "dur": 0.617, "args": { "External id": 17356,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039344.652, "dur": 2.101, "args": { "External id": 17357,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039345.691, "dur": 0.999, "args": { "External id": 17358,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039347.008, "dur": 1.296, "args": { "External id": 17359,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039347.383, "dur": 0.854, "args": { "External id": 17360,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039348.530, "dur": 2.640, "args": { "External id": 17361,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039350.390, "dur": 0.711, "args": { "External id": 17362,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039351.393, "dur": 1.397, "args": { "External id": 17363,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039352.108, "dur": 0.616, "args": { "External id": 17364,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039353.056, "dur": 2.220, "args": { "External id": 17365,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039353.453, "dur": 1.750, "args": { "External id": 17366,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039356.914, "dur": 1.357, "args": { "External id": 17367,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039357.624, "dur": 0.582, "args": { "External id": 17368,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039358.496, "dur": 1.131, "args": { "External id": 17369,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039358.876, "dur": 0.687, "args": { "External id": 17370,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039359.990, "dur": 3.288, "args": { "External id": 17371,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039362.551, "dur": 0.652, "args": { "External id": 17372,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039363.571, "dur": 1.632, "args": { "External id": 17373,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039364.356, "dur": 0.781, "args": { "External id": 17374,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039365.428, "dur": 1.356, "args": { "External id": 17375,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039365.821, "dur": 0.896, "args": { "External id": 17376,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039367.154, "dur": 2.521, "args": { "External id": 17377,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039368.915, "dur": 0.694, "args": { "External id": 17378,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039369.918, "dur": 1.191, "args": { "External id": 17379,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039370.445, "dur": 0.602, "args": { "External id": 17380,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039371.341, "dur": 2.006, "args": { "External id": 17381,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039371.691, "dur": 1.587, "args": { "External id": 17382,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039375.355, "dur": 1.206, "args": { "External id": 17383,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039375.910, "dur": 0.582, "args": { "External id": 17384,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039376.786, "dur": 1.325, "args": { "External id": 17385,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039377.155, "dur": 0.885, "args": { "External id": 17386,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039378.335, "dur": 2.734, "args": { "External id": 17387,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039380.322, "dur": 0.671, "args": { "External id": 17388,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039381.441, "dur": 1.199, "args": { "External id": 17389,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039382.022, "dur": 0.550, "args": { "External id": 17390,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039383.003, "dur": 1.515, "args": { "External id": 17391,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039383.555, "dur": 0.885, "args": { "External id": 17392,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039384.865, "dur": 3.302, "args": { "External id": 17393,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039387.114, "dur": 0.981, "args": { "External id": 17394,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039388.487, "dur": 1.622, "args": { "External id": 17395,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039389.270, "dur": 0.775, "args": { "External id": 17396,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039390.543, "dur": 2.781, "args": { "External id": 17397,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039391.248, "dur": 2.006, "args": { "External id": 17398,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039395.215, "dur": 1.579, "args": { "External id": 17399,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039395.885, "dur": 0.841, "args": { "External id": 17400,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039397.174, "dur": 1.215, "args": { "External id": 17401,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039397.565, "dur": 0.757, "args": { "External id": 17402,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039398.629, "dur": 2.757, "args": { "External id": 17403,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039400.608, "dur": 0.718, "args": { "External id": 17404,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039401.674, "dur": 1.185, "args": { "External id": 17405,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039402.147, "dur": 0.647, "args": { "External id": 17406,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039403.078, "dur": 1.162, "args": { "External id": 17407,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039403.431, "dur": 0.744, "args": { "External id": 17408,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039428.620, "dur": 3.356, "args": { "External id": 23553,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039430.562, "dur": 1.344, "args": { "External id": 23554,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039432.285, "dur": 1.130, "args": { "External id": 23555,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039432.774, "dur": 0.570, "args": { "External id": 23556,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039433.704, "dur": 2.539, "args": { "External id": 23557,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039434.593, "dur": 1.577, "args": { "External id": 23558,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039438.152, "dur": 1.457, "args": { "External id": 23559,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039439.091, "dur": 0.447, "args": { "External id": 23560,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039439.858, "dur": 2.053, "args": { "External id": 23561,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039441.022, "dur": 0.816, "args": { "External id": 23562,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039442.163, "dur": 3.095, "args": { "External id": 23563,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039444.671, "dur": 0.517, "args": { "External id": 23564,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039445.529, "dur": 2.120, "args": { "External id": 23565,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039446.871, "dur": 0.712, "args": { "External id": 23566,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039448.097, "dur": 1.816, "args": { "External id": 23567,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039449.037, "dur": 0.805, "args": { "External id": 23568,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039450.167, "dur": 3.332, "args": { "External id": 23569,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039452.635, "dur": 0.798, "args": { "External id": 23570,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039453.754, "dur": 1.061, "args": { "External id": 23571,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039454.243, "dur": 0.504, "args": { "External id": 23572,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039455.064, "dur": 2.351, "args": { "External id": 23573,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039455.518, "dur": 1.816, "args": { "External id": 23574,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039459.041, "dur": 1.052, "args": { "External id": 23575,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039459.451, "dur": 0.577, "args": { "External id": 23576,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039460.571, "dur": 1.053, "args": { "External id": 23577,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039461.016, "dur": 0.535, "args": { "External id": 23578,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039462.080, "dur": 2.506, "args": { "External id": 23579,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039463.936, "dur": 0.572, "args": { "External id": 23580,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039464.875, "dur": 1.104, "args": { "External id": 23581,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039465.316, "dur": 0.593, "args": { "External id": 23582,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039466.225, "dur": 1.248, "args": { "External id": 23583,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039466.633, "dur": 0.768, "args": { "External id": 23584,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039467.730, "dur": 2.313, "args": { "External id": 23585,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039469.552, "dur": 0.425, "args": { "External id": 23586,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039470.341, "dur": 0.976, "args": { "External id": 23587,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039470.783, "dur": 0.470, "args": { "External id": 23588,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039471.564, "dur": 2.911, "args": { "External id": 23589,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039471.981, "dur": 2.416, "args": { "External id": 23590,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039476.421, "dur": 1.195, "args": { "External id": 23591,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039476.842, "dur": 0.704, "args": { "External id": 23592,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039477.865, "dur": 1.481, "args": { "External id": 23593,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039478.275, "dur": 0.999, "args": { "External id": 23594,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039479.597, "dur": 2.600, "args": { "External id": 23595,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039481.523, "dur": 0.603, "args": { "External id": 23596,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039482.466, "dur": 1.099, "args": { "External id": 23597,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039482.875, "dur": 0.622, "args": { "External id": 23598,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039483.967, "dur": 1.198, "args": { "External id": 23599,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039484.385, "dur": 0.705, "args": { "External id": 23600,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039485.416, "dur": 2.208, "args": { "External id": 23601,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039487.145, "dur": 0.413, "args": { "External id": 23602,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039487.873, "dur": 1.023, "args": { "External id": 23603,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039488.276, "dur": 0.553, "args": { "External id": 23604,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039489.162, "dur": 2.662, "args": { "External id": 23605,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039489.614, "dur": 2.131, "args": { "External id": 23606,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039493.222, "dur": 1.120, "args": { "External id": 23607,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039493.646, "dur": 0.631, "args": { "External id": 23608,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039494.791, "dur": 1.147, "args": { "External id": 23609,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039495.209, "dur": 0.658, "args": { "External id": 23610,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039496.355, "dur": 2.407, "args": { "External id": 23611,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039498.208, "dur": 0.482, "args": { "External id": 23612,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039499.031, "dur": 0.947, "args": { "External id": 23613,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039499.468, "dur": 0.447, "args": { "External id": 23614,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039500.244, "dur": 1.140, "args": { "External id": 23615,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039500.683, "dur": 0.627, "args": { "External id": 23616,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039501.632, "dur": 2.647, "args": { "External id": 23617,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039503.758, "dur": 0.450, "args": { "External id": 23618,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039504.530, "dur": 1.172, "args": { "External id": 23619,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039504.971, "dur": 0.664, "args": { "External id": 23620,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039505.961, "dur": 2.394, "args": { "External id": 23621,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039506.641, "dur": 1.634, "args": { "External id": 23622,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039510.214, "dur": 1.458, "args": { "External id": 23623,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039511.002, "dur": 0.606, "args": { "External id": 23624,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039511.924, "dur": 1.249, "args": { "External id": 23625,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039512.590, "dur": 0.510, "args": { "External id": 23626,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039513.548, "dur": 2.970, "args": { "External id": 23627,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039515.813, "dur": 0.637, "args": { "External id": 23628,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039516.786, "dur": 1.112, "args": { "External id": 23629,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039517.574, "dur": 0.252, "args": { "External id": 23630,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039518.296, "dur": 1.431, "args": { "External id": 23631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039519.067, "dur": 0.587, "args": { "External id": 23632,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039519.980, "dur": 2.541, "args": { "External id": 23633,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039522.174, "dur": 0.271, "args": { "External id": 23634,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039522.777, "dur": 1.122, "args": { "External id": 23635,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039523.422, "dur": 0.410, "args": { "External id": 23636,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039524.148, "dur": 2.316, "args": { "External id": 23637,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039524.877, "dur": 1.510, "args": { "External id": 23638,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039528.486, "dur": 1.348, "args": { "External id": 23639,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039529.131, "dur": 0.640, "args": { "External id": 23640,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039530.268, "dur": 1.133, "args": { "External id": 23641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039530.974, "dur": 0.353, "args": { "External id": 23642,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039531.691, "dur": 2.066, "args": { "External id": 23643,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039533.473, "dur": 0.211, "args": { "External id": 23644,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039534.058, "dur": 1.291, "args": { "External id": 23645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039534.628, "dur": 0.651, "args": { "External id": 23646,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039535.600, "dur": 1.706, "args": { "External id": 23647,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039536.513, "dur": 0.691, "args": { "External id": 23648,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039537.670, "dur": 2.469, "args": { "External id": 23649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039539.728, "dur": 0.338, "args": { "External id": 23650,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039540.405, "dur": 1.259, "args": { "External id": 23651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039541.274, "dur": 0.314, "args": { "External id": 23652,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039541.913, "dur": 2.754, "args": { "External id": 23653,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039542.803, "dur": 1.784, "args": { "External id": 23654,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039546.341, "dur": 1.294, "args": { "External id": 23655,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039547.214, "dur": 0.346, "args": { "External id": 23656,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039547.892, "dur": 1.054, "args": { "External id": 23657,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039548.535, "dur": 0.337, "args": { "External id": 23658,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039549.194, "dur": 2.501, "args": { "External id": 23659,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039551.209, "dur": 0.423, "args": { "External id": 23660,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039551.965, "dur": 1.071, "args": { "External id": 23661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039552.692, "dur": 0.270, "args": { "External id": 23662,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039553.285, "dur": 1.107, "args": { "External id": 23663,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039553.947, "dur": 0.370, "args": { "External id": 23664,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039554.642, "dur": 2.623, "args": { "External id": 23665,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039556.698, "dur": 0.504, "args": { "External id": 23666,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039557.525, "dur": 1.395, "args": { "External id": 23667,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039558.385, "dur": 0.467, "args": { "External id": 23668,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039559.168, "dur": 2.390, "args": { "External id": 23669,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039559.852, "dur": 1.629, "args": { "External id": 23670,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039563.178, "dur": 1.243, "args": { "External id": 23671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039563.961, "dur": 0.388, "args": { "External id": 23672,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039564.685, "dur": 1.153, "args": { "External id": 23673,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039565.336, "dur": 0.430, "args": { "External id": 23674,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039566.091, "dur": 2.308, "args": { "External id": 23675,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039567.905, "dur": 0.425, "args": { "External id": 23676,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039568.672, "dur": 1.332, "args": { "External id": 23677,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039569.431, "dur": 0.502, "args": { "External id": 23678,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039570.255, "dur": 1.270, "args": { "External id": 23679,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039570.928, "dur": 0.528, "args": { "External id": 23680,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039571.771, "dur": 2.616, "args": { "External id": 23681,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039573.945, "dur": 0.371, "args": { "External id": 23682,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039574.653, "dur": 2.377, "args": { "External id": 23683,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039576.429, "dur": 0.525, "args": { "External id": 23684,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039577.317, "dur": 2.467, "args": { "External id": 23685,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039578.058, "dur": 1.648, "args": { "External id": 23686,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039581.751, "dur": 1.527, "args": { "External id": 23687,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039582.627, "dur": 0.579, "args": { "External id": 23688,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039583.525, "dur": 1.696, "args": { "External id": 23689,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039584.398, "dur": 0.750, "args": { "External id": 23690,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039585.495, "dur": 2.668, "args": { "External id": 23691,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039587.743, "dur": 0.345, "args": { "External id": 23692,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039588.432, "dur": 1.198, "args": { "External id": 23693,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039589.132, "dur": 0.431, "args": { "External id": 23694,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039589.882, "dur": 1.396, "args": { "External id": 23695,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039590.703, "dur": 0.502, "args": { "External id": 23696,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039591.529, "dur": 2.927, "args": { "External id": 23697,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039593.952, "dur": 0.431, "args": { "External id": 23698,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039594.740, "dur": 1.416, "args": { "External id": 23699,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039595.550, "dur": 0.424, "args": { "External id": 23700,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039596.412, "dur": 2.457, "args": { "External id": 23701,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039597.183, "dur": 1.606, "args": { "External id": 23702,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039600.578, "dur": 1.083, "args": { "External id": 23703,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039601.294, "dur": 0.295, "args": { "External id": 23704,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039602.149, "dur": 1.154, "args": { "External id": 23705,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039602.796, "dur": 0.434, "args": { "External id": 23706,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039603.569, "dur": 2.321, "args": { "External id": 23707,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039605.476, "dur": 0.340, "args": { "External id": 23708,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039606.180, "dur": 1.447, "args": { "External id": 23709,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039606.917, "dur": 0.639, "args": { "External id": 23710,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039607.876, "dur": 1.187, "args": { "External id": 23711,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039608.567, "dur": 0.422, "args": { "External id": 23712,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039609.311, "dur": 2.852, "args": { "External id": 23713,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039611.679, "dur": 0.414, "args": { "External id": 23714,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039612.413, "dur": 1.032, "args": { "External id": 23715,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039613.098, "dur": 0.272, "args": { "External id": 23716,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039613.732, "dur": 2.702, "args": { "External id": 23717,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039614.487, "dur": 1.869, "args": { "External id": 23718,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039618.374, "dur": 1.209, "args": { "External id": 23719,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039619.003, "dur": 0.512, "args": { "External id": 23720,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039619.840, "dur": 1.192, "args": { "External id": 23721,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039620.558, "dur": 0.400, "args": { "External id": 23722,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039621.282, "dur": 2.835, "args": { "External id": 23723,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039623.716, "dur": 0.328, "args": { "External id": 23724,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039624.395, "dur": 1.141, "args": { "External id": 23725,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039625.047, "dur": 0.261, "args": { "External id": 23726,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039625.828, "dur": 1.153, "args": { "External id": 23727,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039626.535, "dur": 0.373, "args": { "External id": 23728,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039627.263, "dur": 2.814, "args": { "External id": 23729,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039629.266, "dur": 0.736, "args": { "External id": 23730,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039630.427, "dur": 1.316, "args": { "External id": 23731,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039631.065, "dur": 0.609, "args": { "External id": 23732,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039632.011, "dur": 2.854, "args": { "External id": 23733,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039632.912, "dur": 1.767, "args": { "External id": 23734,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039636.876, "dur": 1.313, "args": { "External id": 23735,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039637.459, "dur": 0.464, "args": { "External id": 23736,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039638.438, "dur": 1.627, "args": { "External id": 23737,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039639.174, "dur": 0.589, "args": { "External id": 23738,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039640.352, "dur": 2.566, "args": { "External id": 23739,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039642.503, "dur": 0.340, "args": { "External id": 23740,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039643.261, "dur": 1.090, "args": { "External id": 23741,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039643.942, "dur": 0.336, "args": { "External id": 23742,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039644.600, "dur": 1.569, "args": { "External id": 23743,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039645.413, "dur": 0.684, "args": { "External id": 23744,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039646.418, "dur": 2.656, "args": { "External id": 23745,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039648.425, "dur": 0.585, "args": { "External id": 23746,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039649.349, "dur": 1.129, "args": { "External id": 23747,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039650.070, "dur": 0.333, "args": { "External id": 23748,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039650.727, "dur": 2.673, "args": { "External id": 23749,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039651.563, "dur": 1.762, "args": { "External id": 23750,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039655.147, "dur": 1.249, "args": { "External id": 23751,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039655.988, "dur": 0.331, "args": { "External id": 23752,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039656.992, "dur": 1.382, "args": { "External id": 23753,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039657.740, "dur": 0.419, "args": { "External id": 23754,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039658.652, "dur": 2.709, "args": { "External id": 23755,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039661.032, "dur": 0.254, "args": { "External id": 23756,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039661.671, "dur": 1.113, "args": { "External id": 23757,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039662.308, "dur": 0.412, "args": { "External id": 23758,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039663.054, "dur": 1.410, "args": { "External id": 23759,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039663.980, "dur": 0.411, "args": { "External id": 23760,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039664.731, "dur": 2.444, "args": { "External id": 23761,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039666.799, "dur": 0.299, "args": { "External id": 23762,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039667.444, "dur": 1.249, "args": { "External id": 23763,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039668.260, "dur": 0.239, "args": { "External id": 23764,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039668.957, "dur": 2.643, "args": { "External id": 23765,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039669.760, "dur": 1.637, "args": { "External id": 23766,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039673.673, "dur": 1.206, "args": { "External id": 23767,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039674.403, "dur": 0.290, "args": { "External id": 23768,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039675.127, "dur": 1.262, "args": { "External id": 23769,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039675.698, "dur": 0.619, "args": { "External id": 23770,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039676.638, "dur": 2.669, "args": { "External id": 23771,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039678.932, "dur": 0.301, "args": { "External id": 23772,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039679.584, "dur": 1.164, "args": { "External id": 23773,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039680.376, "dur": 0.297, "args": { "External id": 23774,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039680.998, "dur": 1.207, "args": { "External id": 23775,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039681.769, "dur": 0.367, "args": { "External id": 23776,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039682.455, "dur": 2.885, "args": { "External id": 23777,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039684.612, "dur": 0.523, "args": { "External id": 23778,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039685.639, "dur": 1.467, "args": { "External id": 23779,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039686.424, "dur": 0.485, "args": { "External id": 23780,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039687.396, "dur": 2.527, "args": { "External id": 23781,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039688.177, "dur": 1.667, "args": { "External id": 23782,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039691.465, "dur": 1.072, "args": { "External id": 23783,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039692.224, "dur": 0.240, "args": { "External id": 23784,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039692.789, "dur": 1.469, "args": { "External id": 23785,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039693.584, "dur": 0.600, "args": { "External id": 23786,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039694.513, "dur": 2.957, "args": { "External id": 23787,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039697.143, "dur": 0.251, "args": { "External id": 23788,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039697.738, "dur": 1.280, "args": { "External id": 23789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039698.597, "dur": 0.348, "args": { "External id": 23790,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039699.289, "dur": 1.101, "args": { "External id": 23791,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039699.858, "dur": 0.459, "args": { "External id": 23792,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039700.641, "dur": 2.424, "args": { "External id": 23793,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039702.640, "dur": 0.353, "args": { "External id": 23794,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039703.377, "dur": 1.260, "args": { "External id": 23795,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039704.189, "dur": 0.374, "args": { "External id": 23796,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039704.989, "dur": 2.461, "args": { "External id": 23797,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039705.770, "dur": 1.603, "args": { "External id": 23798,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039709.462, "dur": 1.393, "args": { "External id": 23799,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039710.203, "dur": 0.584, "args": { "External id": 23800,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039711.250, "dur": 1.131, "args": { "External id": 23801,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039711.981, "dur": 0.329, "args": { "External id": 23802,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039712.640, "dur": 2.753, "args": { "External id": 23803,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039715.035, "dur": 0.285, "args": { "External id": 23804,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039715.691, "dur": 1.289, "args": { "External id": 23805,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039716.436, "dur": 0.480, "args": { "External id": 23806,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039717.229, "dur": 1.385, "args": { "External id": 23807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039717.916, "dur": 0.627, "args": { "External id": 23808,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039718.870, "dur": 3.104, "args": { "External id": 23809,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039721.284, "dur": 0.618, "args": { "External id": 23810,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039722.241, "dur": 0.932, "args": { "External id": 23811,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039722.872, "dur": 0.228, "args": { "External id": 23812,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039723.426, "dur": 2.503, "args": { "External id": 23813,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039724.005, "dur": 1.697, "args": { "External id": 23814,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039728.184, "dur": 1.202, "args": { "External id": 23815,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039728.962, "dur": 0.349, "args": { "External id": 23816,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039729.637, "dur": 0.956, "args": { "External id": 23817,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039730.182, "dur": 0.340, "args": { "External id": 23818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039730.845, "dur": 2.490, "args": { "External id": 23819,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039732.988, "dur": 0.274, "args": { "External id": 23820,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039733.604, "dur": 0.996, "args": { "External id": 23821,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039734.192, "dur": 0.336, "args": { "External id": 23822,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039734.847, "dur": 1.228, "args": { "External id": 23823,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039735.520, "dur": 0.482, "args": { "External id": 23824,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039736.324, "dur": 2.793, "args": { "External id": 23825,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039738.580, "dur": 0.320, "args": { "External id": 23826,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039739.373, "dur": 1.096, "args": { "External id": 23827,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039740.092, "dur": 0.308, "args": { "External id": 23828,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039740.729, "dur": 2.295, "args": { "External id": 23829,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039741.306, "dur": 1.647, "args": { "External id": 23830,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039744.627, "dur": 1.393, "args": { "External id": 23831,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039745.386, "dur": 0.241, "args": { "External id": 23832,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039746.273, "dur": 1.389, "args": { "External id": 23833,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039746.904, "dur": 0.538, "args": { "External id": 23834,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039747.912, "dur": 2.481, "args": { "External id": 23835,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039749.970, "dur": 0.351, "args": { "External id": 23836,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039750.666, "dur": 1.414, "args": { "External id": 23837,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039751.427, "dur": 0.586, "args": { "External id": 23838,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039752.331, "dur": 1.224, "args": { "External id": 23839,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039752.973, "dur": 0.516, "args": { "External id": 23840,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039753.806, "dur": 2.150, "args": { "External id": 23841,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039755.575, "dur": 0.305, "args": { "External id": 23842,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039756.232, "dur": 0.864, "args": { "External id": 23843,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039756.811, "dur": 0.210, "args": { "External id": 23844,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039757.346, "dur": 2.281, "args": { "External id": 23845,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039757.975, "dur": 1.579, "args": { "External id": 23846,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039761.280, "dur": 1.162, "args": { "External id": 23847,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039762.041, "dur": 0.338, "args": { "External id": 23848,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039762.695, "dur": 1.191, "args": { "External id": 23849,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039763.444, "dur": 0.370, "args": { "External id": 23850,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039764.132, "dur": 2.463, "args": { "External id": 23851,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039766.249, "dur": 0.277, "args": { "External id": 23852,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039766.868, "dur": 1.139, "args": { "External id": 23853,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039767.607, "dur": 0.330, "args": { "External id": 23854,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039768.257, "dur": 1.276, "args": { "External id": 23855,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039768.954, "dur": 0.331, "args": { "External id": 23856,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039769.802, "dur": 2.911, "args": { "External id": 23857,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039772.088, "dur": 0.268, "args": { "External id": 23858,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039772.980, "dur": 1.126, "args": { "External id": 23859,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039773.780, "dur": 0.258, "args": { "External id": 23860,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039774.362, "dur": 2.476, "args": { "External id": 23861,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039775.012, "dur": 1.557, "args": { "External id": 23862,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039778.493, "dur": 1.022, "args": { "External id": 23863,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039779.162, "dur": 0.285, "args": { "External id": 23864,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039779.773, "dur": 1.264, "args": { "External id": 23865,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039780.479, "dur": 0.336, "args": { "External id": 23866,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039781.318, "dur": 2.653, "args": { "External id": 23867,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039783.601, "dur": 0.292, "args": { "External id": 23868,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039784.262, "dur": 0.965, "args": { "External id": 23869,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039784.834, "dur": 0.325, "args": { "External id": 23870,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039785.530, "dur": 1.201, "args": { "External id": 23871,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039786.366, "dur": 0.299, "args": { "External id": 23872,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039786.996, "dur": 2.351, "args": { "External id": 23873,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039789.044, "dur": 0.237, "args": { "External id": 23874,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039789.659, "dur": 1.332, "args": { "External id": 23875,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039790.405, "dur": 0.509, "args": { "External id": 23876,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039791.247, "dur": 2.514, "args": { "External id": 23877,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039791.947, "dur": 1.734, "args": { "External id": 23878,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039795.802, "dur": 1.212, "args": { "External id": 23879,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039796.514, "dur": 0.311, "args": { "External id": 23880,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039797.372, "dur": 1.166, "args": { "External id": 23881,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039798.121, "dur": 0.351, "args": { "External id": 23882,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039798.818, "dur": 2.752, "args": { "External id": 23883,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039801.234, "dur": 0.270, "args": { "External id": 23884,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039801.840, "dur": 1.105, "args": { "External id": 23885,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039802.567, "dur": 0.314, "args": { "External id": 23886,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039803.304, "dur": 1.236, "args": { "External id": 23887,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039804.240, "dur": 0.231, "args": { "External id": 23888,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039804.790, "dur": 2.698, "args": { "External id": 23889,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039807.094, "dur": 0.326, "args": { "External id": 23890,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039807.751, "dur": 1.240, "args": { "External id": 23891,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039808.432, "dur": 0.300, "args": { "External id": 23892,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039809.239, "dur": 2.761, "args": { "External id": 23893,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039809.968, "dur": 1.958, "args": { "External id": 23894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039814.037, "dur": 1.080, "args": { "External id": 23895,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039814.717, "dur": 0.332, "args": { "External id": 23896,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039815.372, "dur": 1.150, "args": { "External id": 23897,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039816.048, "dur": 0.403, "args": { "External id": 23898,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039816.768, "dur": 2.609, "args": { "External id": 23899,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039819.028, "dur": 0.280, "args": { "External id": 23900,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039819.691, "dur": 1.339, "args": { "External id": 23901,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039820.410, "dur": 0.345, "args": { "External id": 23902,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039821.284, "dur": 1.091, "args": { "External id": 23903,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039821.964, "dur": 0.342, "args": { "External id": 23904,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039822.680, "dur": 3.008, "args": { "External id": 23905,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039825.406, "dur": 0.210, "args": { "External id": 23906,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039826.023, "dur": 1.167, "args": { "External id": 23907,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039826.826, "dur": 0.296, "args": { "External id": 23908,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039827.466, "dur": 2.130, "args": { "External id": 23909,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039828.092, "dur": 1.431, "args": { "External id": 23910,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039830.979, "dur": 1.044, "args": { "External id": 23911,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039831.653, "dur": 0.303, "args": { "External id": 23912,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039832.367, "dur": 1.054, "args": { "External id": 23913,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039832.964, "dur": 0.386, "args": { "External id": 23914,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039833.688, "dur": 2.729, "args": { "External id": 23915,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039836.046, "dur": 0.301, "args": { "External id": 23916,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039836.711, "dur": 1.165, "args": { "External id": 23917,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039837.516, "dur": 0.290, "args": { "External id": 23918,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039838.148, "dur": 1.147, "args": { "External id": 23919,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039838.908, "dur": 0.321, "args": { "External id": 23920,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039839.562, "dur": 2.248, "args": { "External id": 23921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039841.469, "dur": 0.273, "args": { "External id": 23922,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039842.066, "dur": 1.016, "args": { "External id": 23923,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039842.734, "dur": 0.281, "args": { "External id": 23924,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039843.368, "dur": 2.551, "args": { "External id": 23925,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039844.117, "dur": 1.595, "args": { "External id": 23926,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039847.748, "dur": 1.110, "args": { "External id": 23927,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039848.454, "dur": 0.336, "args": { "External id": 23928,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039849.108, "dur": 1.221, "args": { "External id": 23929,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039849.844, "dur": 0.416, "args": { "External id": 23930,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039850.579, "dur": 2.598, "args": { "External id": 23931,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039852.796, "dur": 0.314, "args": { "External id": 23932,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039853.450, "dur": 1.098, "args": { "External id": 23933,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039854.194, "dur": 0.284, "args": { "External id": 23934,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039854.799, "dur": 1.143, "args": { "External id": 23935,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039855.508, "dur": 0.367, "args": { "External id": 23936,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039856.192, "dur": 2.678, "args": { "External id": 23937,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039858.537, "dur": 0.266, "args": { "External id": 23938,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336759, "tid": 1336759, "ts": 1295652039859.137, "dur": 1.986, "args": { "External id": 23939,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652039860.697, "dur": 0.359, "args": { "External id": 23940,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336759, "tid": 1336759, "ts": 1295652039879.451, "dur": 157.769, "args": { "External id": 23941,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336759, "tid": 1336759, "ts": 1295652040137.892, "dur": 146.723, "args": { "External id": 23942,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336759, "tid": 1336759, "ts": 1295652040198.301, "dur": 63.386, "args": { "External id": 23943,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336759, "tid": 1336759, "ts": 1295652040214.654, "dur": 1.109, "args": { "External id": 23944,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11295 } }, { "ph": "X", "cat": "cpu_op", "name": "Redistribute", "pid": 1336759, "tid": 1336759, "ts": 1295652040618.003, "dur": 952.901, "args": { "External id": 23945,"Sequence number": 246776, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "False"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336759, "tid": 1336759, "ts": 1295652040668.977, "dur": 92.427, "args": { "External id": 23946,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652040674.416, "dur": 1.459, "args": { "External id": 23947,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652040721.186, "dur": 0.867, "args": { "External id": 23948,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11299 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::all_reduce", "pid": 1336759, "tid": 1336759, "ts": 1295652040786.847, "dur": 477.360, "args": { "External id": 23949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["float", "", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336759, "tid": 1336759, "ts": 1295652040791.419, "dur": 43.154, "args": { "External id": 23950,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336759, "tid": 1336759, "ts": 1295652040794.589, "dur": 10.344, "args": { "External id": 23951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "0"], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295652040799.811, "dur": 4.329, "args": { "External id": 23952,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336759, "tid": 1336759, "ts": 1295652040806.336, "dur": 27.594, "args": { "External id": 23953,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11304 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::allreduce_", "pid": 1336759, "tid": 1336759, "ts": 1295652040844.660, "dur": 415.378, "args": { "External id": 23954,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "-1"], "Input type": ["TensorList", "", "", "", "Scalar"], "Input Strides": [[[]], [], [], [], []], "Input Dims": [[[]], [], [], [], []], "Ev Idx": 11305 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295652040875.028, "dur": 376.996, "args": { "External id": 23955,"Record function id": 0, "Collective name": "allreduce", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 6, "Input Strides": [[[]], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "6", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1, "Process Group Name": "0", "Input type": ["TensorList", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[[]], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 11306, "In msg nelems": 1 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:all_reduce", "pid": 1336759, "tid": 1336759, "ts": 1295652040890.734, "dur": 354.406, "args": { "External id": 23956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336759, "tid": 1336759, "ts": 1295652041328.372, "dur": 207.737, "args": { "External id": 23957,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11308 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::wait_tensor", "pid": 1336759, "tid": 1336759, "ts": 1295652041417.284, "dur": 38.746, "args": { "External id": 23958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11309 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336759, "tid": 1336759, "ts": 1295652041437.999, "dur": 9.490, "args": { "External id": 23959,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "6", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 11310, "In msg nelems": 0, "Rank": 6, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336759, "tid": 1336759, "ts": 1295652041485.738, "dur": 44.380, "args": { "External id": 23960,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652041488.764, "dur": 1.259, "args": { "External id": 23961,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652041491.576, "dur": 0.589, "args": { "External id": 23962,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11313 } }, { "ph": "X", "cat": "cpu_op", "name": "_ToTorchTensor", "pid": 1336759, "tid": 1336759, "ts": 1295652041586.216, "dur": 20.828, "args": { "External id": 23963,"Sequence number": 246777, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336759, "tid": 1336759, "ts": 1295652041595.757, "dur": 8.045, "args": { "External id": 23964,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336759, "tid": 1336759, "ts": 1295652041598.084, "dur": 5.532, "args": { "External id": 23965,"Record function id": 0, "Concrete Inputs": ["", "[]"], "Input type": ["float", "ScalarList"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336759, "tid": 1336759, "ts": 1295652041917.005, "dur": 30.246, "args": { "External id": 23966,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "double", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reciprocal", "pid": 1336759, "tid": 1336759, "ts": 1295652041956.310, "dur": 21.422, "args": { "External id": 23967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mul", "pid": 1336759, "tid": 1336759, "ts": 1295652042023.526, "dur": 41.439, "args": { "External id": 23968,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "double"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clamp", "pid": 1336759, "tid": 1336759, "ts": 1295652042085.909, "dur": 26.492, "args": { "External id": 23969,"Record function id": 0, "Concrete Inputs": ["", "", "1."], "Input type": ["float", "", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652042090.315, "dur": 0.666, "args": { "External id": 23970,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336759, "tid": 1336759, "ts": 1295652042131.212, "dur": 0.421, "args": { "External id": 23971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 11322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336759, "tid": 1336759, "ts": 1295652042258.841, "dur": 673.807, "args": { "External id": 23972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336759, "tid": 1336759, "ts": 1295652042743.724, "dur": 158.883, "args": { "External id": 23973,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isnan", "pid": 1336759, "tid": 1336759, "ts": 1295652042975.831, "dur": 58.724, "args": { "External id": 23974,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336759, "tid": 1336759, "ts": 1295652042979.808, "dur": 53.907, "args": { "External id": 23975,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1336759, "ts": 1295652043039.918, "dur": 1622.254, "args": { "External id": 23976,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295652043041.375, "dur": 1620.514, "args": { "External id": 23977,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295652043043.250, "dur": 1617.742, "args": { "External id": 23978,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isinf", "pid": 1336759, "tid": 1336759, "ts": 1295652044669.053, "dur": 60.978, "args": { "External id": 23979,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295652044672.456, "dur": 35.094, "args": { "External id": 23980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336759, "tid": 1336759, "ts": 1295652044679.877, "dur": 3.385, "args": { "External id": 23981,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336759, "tid": 1336759, "ts": 1295652044685.049, "dur": 22.222, "args": { "External id": 23982,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], [1]], "Input Dims": [[], [0]], "Ev Idx": 11333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336759, "tid": 1336759, "ts": 1295652044690.073, "dur": 2.646, "args": { "External id": 23983,"Record function id": 0, "Concrete Inputs": ["", "[]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 11334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336759, "tid": 1336759, "ts": 1295652044709.159, "dur": 19.952, "args": { "External id": 23984,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336759, "tid": 1336759, "ts": 1295652044732.883, "dur": 36.716, "args": { "External id": 23985,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336759, "tid": 1336759, "ts": 1295652044735.619, "dur": 33.784, "args": { "External id": 23986,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336759, "tid": 1336759, "ts": 1295652044736.528, "dur": 32.586, "args": { "External id": 23987,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11338 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#OptimizersContainer.step", "pid": 1336759, "tid": 1336759, "ts": 1295652044796.931, "dur": 5566.282, "args": { "External id": 23988,"Record function id": 0, "Ev Idx": 11339 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#AdamW.step", "pid": 1336759, "tid": 1336759, "ts": 1295652044827.941, "dur": 5511.545, "args": { "External id": 23989,"Record function id": 0, "Ev Idx": 11340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_add_", "pid": 1336759, "tid": 1336759, "ts": 1295652045957.828, "dur": 312.671, "args": { "External id": 23990,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652045978.922, "dur": 1.145, "args": { "External id": 23991,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046009.485, "dur": 0.471, "args": { "External id": 23992,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046011.025, "dur": 0.104, "args": { "External id": 23993,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046011.508, "dur": 0.195, "args": { "External id": 23994,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046012.245, "dur": 0.304, "args": { "External id": 23995,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046013.044, "dur": 0.087, "args": { "External id": 23996,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046013.589, "dur": 0.090, "args": { "External id": 23997,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046014.058, "dur": 0.082, "args": { "External id": 23998,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046014.483, "dur": 0.078, "args": { "External id": 23999,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046015.043, "dur": 0.074, "args": { "External id": 24000,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046015.570, "dur": 0.072, "args": { "External id": 24001,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046015.974, "dur": 0.266, "args": { "External id": 24002,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046016.624, "dur": 0.062, "args": { "External id": 24003,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046017.085, "dur": 0.061, "args": { "External id": 24004,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046017.467, "dur": 0.066, "args": { "External id": 24005,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046017.880, "dur": 0.064, "args": { "External id": 24006,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046018.336, "dur": 0.064, "args": { "External id": 24007,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046018.740, "dur": 0.069, "args": { "External id": 24008,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046019.142, "dur": 0.065, "args": { "External id": 24009,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046019.595, "dur": 0.061, "args": { "External id": 24010,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046020.020, "dur": 0.064, "args": { "External id": 24011,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046020.413, "dur": 0.062, "args": { "External id": 24012,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046020.947, "dur": 0.069, "args": { "External id": 24013,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046021.332, "dur": 0.066, "args": { "External id": 24014,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046021.766, "dur": 0.063, "args": { "External id": 24015,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046022.181, "dur": 0.066, "args": { "External id": 24016,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046022.720, "dur": 0.062, "args": { "External id": 24017,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046023.256, "dur": 0.069, "args": { "External id": 24018,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046023.765, "dur": 0.065, "args": { "External id": 24019,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046024.241, "dur": 0.065, "args": { "External id": 24020,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046024.632, "dur": 0.065, "args": { "External id": 24021,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046025.022, "dur": 0.063, "args": { "External id": 24022,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046025.471, "dur": 0.067, "args": { "External id": 24023,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046025.880, "dur": 0.062, "args": { "External id": 24024,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046026.347, "dur": 0.065, "args": { "External id": 24025,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046026.752, "dur": 0.067, "args": { "External id": 24026,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046027.229, "dur": 0.057, "args": { "External id": 24027,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046027.693, "dur": 0.066, "args": { "External id": 24028,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046028.136, "dur": 0.065, "args": { "External id": 24029,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046028.569, "dur": 0.069, "args": { "External id": 24030,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046029.056, "dur": 0.064, "args": { "External id": 24031,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046029.456, "dur": 0.062, "args": { "External id": 24032,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046029.912, "dur": 0.059, "args": { "External id": 24033,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046030.340, "dur": 0.062, "args": { "External id": 24034,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046030.786, "dur": 0.089, "args": { "External id": 24035,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046031.183, "dur": 0.053, "args": { "External id": 24036,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046031.620, "dur": 0.086, "args": { "External id": 24037,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046032.065, "dur": 0.086, "args": { "External id": 24038,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046032.626, "dur": 0.059, "args": { "External id": 24039,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046032.968, "dur": 0.065, "args": { "External id": 24040,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046033.382, "dur": 0.075, "args": { "External id": 24041,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046033.797, "dur": 0.064, "args": { "External id": 24042,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046034.267, "dur": 0.086, "args": { "External id": 24043,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046034.669, "dur": 0.063, "args": { "External id": 24044,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046035.196, "dur": 0.056, "args": { "External id": 24045,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046035.618, "dur": 0.052, "args": { "External id": 24046,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046036.049, "dur": 0.061, "args": { "External id": 24047,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046036.412, "dur": 0.061, "args": { "External id": 24048,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046036.765, "dur": 0.064, "args": { "External id": 24049,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046037.125, "dur": 0.069, "args": { "External id": 24050,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046037.593, "dur": 0.068, "args": { "External id": 24051,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046038.060, "dur": 0.064, "args": { "External id": 24052,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046038.492, "dur": 0.282, "args": { "External id": 24053,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046039.135, "dur": 0.211, "args": { "External id": 24054,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046039.843, "dur": 0.063, "args": { "External id": 24055,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046040.227, "dur": 0.062, "args": { "External id": 24056,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046040.608, "dur": 0.061, "args": { "External id": 24057,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046040.989, "dur": 0.063, "args": { "External id": 24058,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046041.429, "dur": 0.064, "args": { "External id": 24059,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046041.909, "dur": 0.084, "args": { "External id": 24060,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046042.388, "dur": 0.057, "args": { "External id": 24061,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046042.791, "dur": 0.060, "args": { "External id": 24062,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046043.174, "dur": 0.057, "args": { "External id": 24063,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046043.539, "dur": 0.056, "args": { "External id": 24064,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046064.988, "dur": 0.061, "args": { "External id": 24065,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046066.476, "dur": 0.052, "args": { "External id": 24066,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046066.873, "dur": 0.051, "args": { "External id": 24067,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046067.374, "dur": 0.066, "args": { "External id": 24068,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046067.752, "dur": 0.052, "args": { "External id": 24069,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046068.269, "dur": 0.057, "args": { "External id": 24070,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046068.594, "dur": 0.052, "args": { "External id": 24071,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046069.236, "dur": 0.061, "args": { "External id": 24072,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046069.558, "dur": 0.055, "args": { "External id": 24073,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046070.063, "dur": 0.066, "args": { "External id": 24074,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046070.419, "dur": 0.052, "args": { "External id": 24075,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046070.906, "dur": 0.063, "args": { "External id": 24076,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046071.246, "dur": 0.053, "args": { "External id": 24077,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046071.743, "dur": 0.063, "args": { "External id": 24078,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046072.064, "dur": 0.050, "args": { "External id": 24079,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046072.577, "dur": 0.065, "args": { "External id": 24080,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046072.898, "dur": 0.052, "args": { "External id": 24081,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046073.432, "dur": 0.062, "args": { "External id": 24082,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046073.754, "dur": 0.054, "args": { "External id": 24083,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046074.293, "dur": 0.063, "args": { "External id": 24084,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046074.617, "dur": 0.052, "args": { "External id": 24085,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046075.157, "dur": 0.063, "args": { "External id": 24086,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046075.477, "dur": 0.056, "args": { "External id": 24087,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046076.017, "dur": 0.062, "args": { "External id": 24088,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046076.340, "dur": 0.053, "args": { "External id": 24089,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046076.819, "dur": 0.065, "args": { "External id": 24090,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046077.143, "dur": 0.051, "args": { "External id": 24091,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046077.619, "dur": 0.059, "args": { "External id": 24092,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046077.940, "dur": 0.050, "args": { "External id": 24093,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046078.479, "dur": 0.084, "args": { "External id": 24094,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046078.823, "dur": 0.053, "args": { "External id": 24095,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046079.349, "dur": 0.060, "args": { "External id": 24096,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046079.665, "dur": 0.053, "args": { "External id": 24097,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046080.167, "dur": 0.053, "args": { "External id": 24098,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046080.582, "dur": 0.063, "args": { "External id": 24099,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046081.330, "dur": 0.048, "args": { "External id": 24100,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046081.672, "dur": 0.046, "args": { "External id": 24101,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046082.209, "dur": 0.053, "args": { "External id": 24102,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046082.521, "dur": 0.049, "args": { "External id": 24103,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046083.029, "dur": 0.066, "args": { "External id": 24104,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046083.412, "dur": 0.063, "args": { "External id": 24105,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046083.904, "dur": 0.058, "args": { "External id": 24106,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046084.221, "dur": 0.056, "args": { "External id": 24107,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046084.753, "dur": 0.069, "args": { "External id": 24108,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046085.076, "dur": 0.054, "args": { "External id": 24109,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046085.584, "dur": 0.066, "args": { "External id": 24110,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046085.906, "dur": 0.054, "args": { "External id": 24111,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046086.404, "dur": 0.065, "args": { "External id": 24112,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046086.741, "dur": 0.055, "args": { "External id": 24113,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046087.256, "dur": 0.069, "args": { "External id": 24114,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046087.583, "dur": 0.054, "args": { "External id": 24115,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046088.093, "dur": 0.070, "args": { "External id": 24116,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046088.423, "dur": 0.050, "args": { "External id": 24117,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046095.222, "dur": 0.059, "args": { "External id": 24118,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046095.580, "dur": 0.057, "args": { "External id": 24119,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046096.426, "dur": 0.062, "args": { "External id": 24120,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046096.807, "dur": 0.052, "args": { "External id": 24121,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046097.285, "dur": 0.070, "args": { "External id": 24122,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046097.597, "dur": 0.054, "args": { "External id": 24123,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046098.146, "dur": 0.061, "args": { "External id": 24124,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046098.451, "dur": 0.062, "args": { "External id": 24125,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046099.103, "dur": 0.066, "args": { "External id": 24126,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046099.414, "dur": 0.049, "args": { "External id": 24127,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046100.062, "dur": 0.062, "args": { "External id": 24128,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046100.367, "dur": 0.055, "args": { "External id": 24129,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046100.958, "dur": 0.066, "args": { "External id": 24130,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046101.269, "dur": 0.049, "args": { "External id": 24131,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046101.766, "dur": 0.067, "args": { "External id": 24132,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046102.080, "dur": 0.049, "args": { "External id": 24133,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046102.715, "dur": 0.066, "args": { "External id": 24134,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046103.031, "dur": 0.064, "args": { "External id": 24135,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046103.558, "dur": 0.050, "args": { "External id": 24136,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046103.859, "dur": 0.047, "args": { "External id": 24137,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046104.502, "dur": 0.063, "args": { "External id": 24138,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046104.816, "dur": 0.077, "args": { "External id": 24139,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046105.467, "dur": 0.068, "args": { "External id": 24140,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046105.780, "dur": 0.059, "args": { "External id": 24141,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046106.298, "dur": 0.062, "args": { "External id": 24142,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046106.608, "dur": 0.054, "args": { "External id": 24143,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046107.260, "dur": 0.062, "args": { "External id": 24144,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046107.568, "dur": 0.049, "args": { "External id": 24145,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046108.240, "dur": 0.064, "args": { "External id": 24146,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046108.548, "dur": 0.055, "args": { "External id": 24147,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046109.161, "dur": 0.068, "args": { "External id": 24148,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046109.483, "dur": 0.052, "args": { "External id": 24149,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046109.994, "dur": 0.066, "args": { "External id": 24150,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046110.315, "dur": 0.066, "args": { "External id": 24151,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046111.041, "dur": 0.066, "args": { "External id": 24152,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046111.363, "dur": 0.052, "args": { "External id": 24153,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046112.043, "dur": 0.065, "args": { "External id": 24154,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046112.366, "dur": 0.051, "args": { "External id": 24155,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046113.026, "dur": 0.067, "args": { "External id": 24156,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046113.348, "dur": 0.056, "args": { "External id": 24157,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046113.939, "dur": 0.064, "args": { "External id": 24158,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046114.259, "dur": 0.051, "args": { "External id": 24159,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046115.078, "dur": 0.091, "args": { "External id": 24160,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046115.434, "dur": 0.050, "args": { "External id": 24161,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046116.025, "dur": 0.065, "args": { "External id": 24162,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046122.021, "dur": 0.069, "args": { "External id": 24163,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046122.694, "dur": 0.069, "args": { "External id": 24164,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046123.106, "dur": 0.068, "args": { "External id": 24165,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046123.708, "dur": 0.054, "args": { "External id": 24166,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046124.024, "dur": 0.056, "args": { "External id": 24167,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046124.494, "dur": 0.060, "args": { "External id": 24168,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046124.814, "dur": 0.050, "args": { "External id": 24169,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046125.243, "dur": 0.064, "args": { "External id": 24170,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046125.652, "dur": 0.067, "args": { "External id": 24171,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046126.290, "dur": 0.065, "args": { "External id": 24172,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046126.615, "dur": 0.053, "args": { "External id": 24173,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046127.226, "dur": 0.051, "args": { "External id": 24174,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046127.535, "dur": 0.053, "args": { "External id": 24175,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046128.107, "dur": 0.061, "args": { "External id": 24176,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046128.428, "dur": 0.053, "args": { "External id": 24177,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046128.940, "dur": 0.061, "args": { "External id": 24178,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046129.259, "dur": 0.053, "args": { "External id": 24179,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046129.754, "dur": 0.062, "args": { "External id": 24180,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046130.084, "dur": 0.056, "args": { "External id": 24181,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046130.580, "dur": 0.061, "args": { "External id": 24182,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046130.898, "dur": 0.054, "args": { "External id": 24183,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046131.527, "dur": 0.064, "args": { "External id": 24184,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046131.848, "dur": 0.076, "args": { "External id": 24185,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046132.335, "dur": 0.066, "args": { "External id": 24186,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046132.657, "dur": 0.056, "args": { "External id": 24187,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046133.161, "dur": 0.066, "args": { "External id": 24188,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046133.490, "dur": 0.054, "args": { "External id": 24189,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046134.141, "dur": 0.072, "args": { "External id": 24190,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046134.469, "dur": 0.055, "args": { "External id": 24191,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046134.933, "dur": 0.066, "args": { "External id": 24192,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046135.293, "dur": 0.053, "args": { "External id": 24193,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046135.975, "dur": 0.067, "args": { "External id": 24194,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046136.304, "dur": 0.049, "args": { "External id": 24195,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046136.954, "dur": 0.061, "args": { "External id": 24196,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046137.315, "dur": 0.057, "args": { "External id": 24197,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046137.970, "dur": 0.065, "args": { "External id": 24198,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046138.292, "dur": 0.052, "args": { "External id": 24199,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046138.946, "dur": 0.061, "args": { "External id": 24200,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046139.268, "dur": 0.055, "args": { "External id": 24201,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046139.813, "dur": 0.064, "args": { "External id": 24202,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046140.123, "dur": 0.054, "args": { "External id": 24203,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046140.809, "dur": 0.064, "args": { "External id": 24204,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046141.118, "dur": 0.055, "args": { "External id": 24205,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046141.599, "dur": 0.062, "args": { "External id": 24206,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046141.907, "dur": 0.054, "args": { "External id": 24207,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046142.407, "dur": 0.066, "args": { "External id": 24208,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046142.708, "dur": 0.056, "args": { "External id": 24209,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046143.188, "dur": 0.067, "args": { "External id": 24210,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046143.499, "dur": 0.052, "args": { "External id": 24211,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046144.184, "dur": 0.065, "args": { "External id": 24212,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046144.493, "dur": 0.052, "args": { "External id": 24213,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046145.030, "dur": 0.064, "args": { "External id": 24214,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046145.353, "dur": 0.051, "args": { "External id": 24215,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046146.068, "dur": 0.052, "args": { "External id": 24216,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046146.661, "dur": 0.070, "args": { "External id": 24217,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046147.319, "dur": 0.068, "args": { "External id": 24218,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046147.646, "dur": 0.053, "args": { "External id": 24219,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046148.198, "dur": 0.061, "args": { "External id": 24220,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046148.519, "dur": 0.054, "args": { "External id": 24221,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046149.013, "dur": 0.064, "args": { "External id": 24222,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046149.366, "dur": 0.047, "args": { "External id": 24223,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046149.877, "dur": 0.064, "args": { "External id": 24224,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046150.198, "dur": 0.054, "args": { "External id": 24225,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046150.792, "dur": 0.058, "args": { "External id": 24226,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046151.101, "dur": 0.051, "args": { "External id": 24227,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046151.764, "dur": 0.057, "args": { "External id": 24228,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046152.083, "dur": 0.046, "args": { "External id": 24229,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046152.559, "dur": 0.062, "args": { "External id": 24230,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046152.879, "dur": 0.052, "args": { "External id": 24231,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046153.387, "dur": 0.056, "args": { "External id": 24232,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046153.701, "dur": 0.045, "args": { "External id": 24233,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046154.193, "dur": 0.057, "args": { "External id": 24234,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046154.503, "dur": 0.047, "args": { "External id": 24235,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046155.150, "dur": 0.056, "args": { "External id": 24236,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046155.466, "dur": 0.048, "args": { "External id": 24237,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046156.139, "dur": 0.049, "args": { "External id": 24238,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046156.449, "dur": 0.043, "args": { "External id": 24239,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046156.985, "dur": 0.058, "args": { "External id": 24240,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046157.300, "dur": 0.052, "args": { "External id": 24241,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046157.847, "dur": 0.063, "args": { "External id": 24242,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046158.166, "dur": 0.053, "args": { "External id": 24243,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046158.725, "dur": 0.062, "args": { "External id": 24244,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046159.048, "dur": 0.045, "args": { "External id": 24245,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046159.664, "dur": 0.056, "args": { "External id": 24246,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046159.981, "dur": 0.049, "args": { "External id": 24247,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046160.595, "dur": 0.057, "args": { "External id": 24248,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046160.910, "dur": 0.050, "args": { "External id": 24249,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046161.705, "dur": 0.047, "args": { "External id": 24250,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046162.012, "dur": 0.050, "args": { "External id": 24251,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046162.525, "dur": 0.054, "args": { "External id": 24252,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046162.837, "dur": 0.048, "args": { "External id": 24253,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046163.401, "dur": 0.053, "args": { "External id": 24254,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046163.712, "dur": 0.053, "args": { "External id": 24255,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046164.185, "dur": 0.063, "args": { "External id": 24256,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046164.505, "dur": 0.052, "args": { "External id": 24257,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046165.181, "dur": 0.061, "args": { "External id": 24258,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046165.501, "dur": 0.057, "args": { "External id": 24259,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046166.078, "dur": 0.060, "args": { "External id": 24260,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046166.400, "dur": 0.055, "args": { "External id": 24261,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046167.152, "dur": 0.056, "args": { "External id": 24262,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046167.465, "dur": 0.052, "args": { "External id": 24263,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046167.948, "dur": 0.067, "args": { "External id": 24264,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046168.270, "dur": 0.055, "args": { "External id": 24265,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046168.785, "dur": 0.067, "args": { "External id": 24266,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046169.105, "dur": 0.057, "args": { "External id": 24267,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046169.788, "dur": 0.057, "args": { "External id": 24268,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046170.099, "dur": 0.051, "args": { "External id": 24269,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046170.705, "dur": 0.055, "args": { "External id": 24270,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046171.057, "dur": 0.050, "args": { "External id": 24271,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046171.665, "dur": 0.054, "args": { "External id": 24272,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046171.980, "dur": 0.051, "args": { "External id": 24273,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046172.507, "dur": 0.057, "args": { "External id": 24274,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046172.819, "dur": 0.058, "args": { "External id": 24275,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046173.311, "dur": 0.068, "args": { "External id": 24276,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046173.645, "dur": 0.069, "args": { "External id": 24277,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046174.281, "dur": 0.067, "args": { "External id": 24278,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046174.605, "dur": 0.070, "args": { "External id": 24279,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046175.235, "dur": 0.068, "args": { "External id": 24280,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336759, "tid": 1336759, "ts": 1295652046175.553, "dur": 0.056, "args": { "External id": 24281,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336759, "tid": 1336759, "ts": 1295652046724.867, "dur": 3521.325, "args": { "External id": 24282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336759, "tid": 1336759, "ts": 1295652049699.980, "dur": 380.896, "args": { "External id": 24283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11634 } }, { "name": "process_name", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 0, "args": { "name": "python3.12" } }, { "name": "process_labels", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 0, "args": { "labels": "CPU" } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 0, "args": { "sort_index": 1336759 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1381173, "args": { "name": "thread 1381173 (pt_autograd_6)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1381173, "args": { "sort_index": 1381173 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1336759, "args": { "name": "thread 1336759 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1336759, "args": { "sort_index": 1336759 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1381173, "args": { "name": "thread 1381173 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886156.686, "pid": 1336759, "tid": 1381173, "args": { "sort_index": 1381173 } }, { "ph": "X", "cat": "Trace", "ts": 1295649886086.788, "dur": 2165941.161, "pid": "Spans", "tid": "PyTorch Profiler", "name": "PyTorch Profiler (0)", "args": { "Op count": 0 } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886086.788, "pid": "Spans", "tid": 0, "args": { "sort_index": 536870912 } }, { "name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", "pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 1295649886086.788 }, { "name": "Record Window End", "ph": "i", "s": "g", "pid": "", "tid": "", "ts": 1295652102719.195 } ], "traceName": "exp/mtp.1B.batch16.seqlen4096.context4096.warmup2000.update1.steps200000.lr2e-4.cosine/profile_trace/iteration_1024/rank6_trace.json", "displayTimeUnit": "ms", "baseTimeNanoseconds": 1751410836000000000 }